2018-11-11 Richard Biener <rguenther@suse.de>
[official-gcc.git] / gcc / cfgexpand.c
blob8fa392fcd8adf931649295351756850204812bc1
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "params.h"
65 #include "tree-inline.h"
66 #include "value-prof.h"
67 #include "tree-ssa-live.h"
68 #include "tree-outof-ssa.h"
69 #include "cfgloop.h"
70 #include "insn-attr.h" /* For INSN_SCHEDULING. */
71 #include "stringpool.h"
72 #include "attribs.h"
73 #include "asan.h"
74 #include "tree-ssa-address.h"
75 #include "output.h"
76 #include "builtins.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 enum gimple_rhs_class grhs_class;
109 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
111 if (grhs_class == GIMPLE_TERNARY_RHS)
112 t = build3 (gimple_assign_rhs_code (stmt),
113 TREE_TYPE (gimple_assign_lhs (stmt)),
114 gimple_assign_rhs1 (stmt),
115 gimple_assign_rhs2 (stmt),
116 gimple_assign_rhs3 (stmt));
117 else if (grhs_class == GIMPLE_BINARY_RHS)
118 t = build2 (gimple_assign_rhs_code (stmt),
119 TREE_TYPE (gimple_assign_lhs (stmt)),
120 gimple_assign_rhs1 (stmt),
121 gimple_assign_rhs2 (stmt));
122 else if (grhs_class == GIMPLE_UNARY_RHS)
123 t = build1 (gimple_assign_rhs_code (stmt),
124 TREE_TYPE (gimple_assign_lhs (stmt)),
125 gimple_assign_rhs1 (stmt));
126 else if (grhs_class == GIMPLE_SINGLE_RHS)
128 t = gimple_assign_rhs1 (stmt);
129 /* Avoid modifying this tree in place below. */
130 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
131 && gimple_location (stmt) != EXPR_LOCATION (t))
132 || (gimple_block (stmt)
133 && currently_expanding_to_rtl
134 && EXPR_P (t)))
135 t = copy_node (t);
137 else
138 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 struct stack_var
310 /* The Variable. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
314 if this variable becomes it's partition's representative. */
315 poly_uint64 size;
317 /* The *byte* alignment required for this variable. Or as, with the
318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* The partition representative. */
322 size_t representative;
324 /* The next stack variable in the partition, or EOC. */
325 size_t next;
327 /* The numbers of conflicting stack variables. */
328 bitmap conflicts;
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation. */
334 static struct stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
344 is non-decreasing. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
356 /* Used during expand_used_vars. Remember if we saw a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
360 /* Compute the byte alignment to use for DECL. Ignore alignment
361 we can't do with expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
369 align = TYPE_ALIGN (TREE_TYPE (decl));
370 else
372 align = LOCAL_DECL_ALIGNMENT (decl);
373 SET_DECL_ALIGN (decl, align);
375 return align / BITS_PER_UNIT;
378 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
379 down otherwise. Return truncated BASE value. */
381 static inline unsigned HOST_WIDE_INT
382 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
384 return align_up ? (base + align - 1) & -align : base & -align;
387 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
388 Return the frame offset. */
390 static poly_int64
391 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
393 poly_int64 offset, new_frame_offset;
395 if (FRAME_GROWS_DOWNWARD)
397 new_frame_offset
398 = aligned_lower_bound (frame_offset - frame_phase - size,
399 align) + frame_phase;
400 offset = new_frame_offset;
402 else
404 new_frame_offset
405 = aligned_upper_bound (frame_offset - frame_phase,
406 align) + frame_phase;
407 offset = new_frame_offset;
408 new_frame_offset += size;
410 frame_offset = new_frame_offset;
412 if (frame_offset_overflow (frame_offset, cfun->decl))
413 frame_offset = offset = 0;
415 return offset;
418 /* Accumulate DECL into STACK_VARS. */
420 static void
421 add_stack_var (tree decl)
423 struct stack_var *v;
425 if (stack_vars_num >= stack_vars_alloc)
427 if (stack_vars_alloc)
428 stack_vars_alloc = stack_vars_alloc * 3 / 2;
429 else
430 stack_vars_alloc = 32;
431 stack_vars
432 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
434 if (!decl_to_stack_part)
435 decl_to_stack_part = new hash_map<tree, size_t>;
437 v = &stack_vars[stack_vars_num];
438 decl_to_stack_part->put (decl, stack_vars_num);
440 v->decl = decl;
441 tree size = TREE_CODE (decl) == SSA_NAME
442 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
443 : DECL_SIZE_UNIT (decl);
444 v->size = tree_to_poly_uint64 (size);
445 /* Ensure that all variables have size, so that &a != &b for any two
446 variables that are simultaneously live. */
447 if (known_eq (v->size, 0U))
448 v->size = 1;
449 v->alignb = align_local_variable (decl);
450 /* An alignment of zero can mightily confuse us later. */
451 gcc_assert (v->alignb != 0);
453 /* All variables are initially in their own partition. */
454 v->representative = stack_vars_num;
455 v->next = EOC;
457 /* All variables initially conflict with no other. */
458 v->conflicts = NULL;
460 /* Ensure that this decl doesn't get put onto the list twice. */
461 set_rtl (decl, pc_rtx);
463 stack_vars_num++;
466 /* Make the decls associated with luid's X and Y conflict. */
468 static void
469 add_stack_var_conflict (size_t x, size_t y)
471 struct stack_var *a = &stack_vars[x];
472 struct stack_var *b = &stack_vars[y];
473 if (!a->conflicts)
474 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
475 if (!b->conflicts)
476 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
477 bitmap_set_bit (a->conflicts, y);
478 bitmap_set_bit (b->conflicts, x);
481 /* Check whether the decls associated with luid's X and Y conflict. */
483 static bool
484 stack_var_conflict_p (size_t x, size_t y)
486 struct stack_var *a = &stack_vars[x];
487 struct stack_var *b = &stack_vars[y];
488 if (x == y)
489 return false;
490 /* Partitions containing an SSA name result from gimple registers
491 with things like unsupported modes. They are top-level and
492 hence conflict with everything else. */
493 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
494 return true;
496 if (!a->conflicts || !b->conflicts)
497 return false;
498 return bitmap_bit_p (a->conflicts, y);
501 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
502 enter its partition number into bitmap DATA. */
504 static bool
505 visit_op (gimple *, tree op, tree, void *data)
507 bitmap active = (bitmap)data;
508 op = get_base_address (op);
509 if (op
510 && DECL_P (op)
511 && DECL_RTL_IF_SET (op) == pc_rtx)
513 size_t *v = decl_to_stack_part->get (op);
514 if (v)
515 bitmap_set_bit (active, *v);
517 return false;
520 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
521 record conflicts between it and all currently active other partitions
522 from bitmap DATA. */
524 static bool
525 visit_conflict (gimple *, tree op, tree, void *data)
527 bitmap active = (bitmap)data;
528 op = get_base_address (op);
529 if (op
530 && DECL_P (op)
531 && DECL_RTL_IF_SET (op) == pc_rtx)
533 size_t *v = decl_to_stack_part->get (op);
534 if (v && bitmap_set_bit (active, *v))
536 size_t num = *v;
537 bitmap_iterator bi;
538 unsigned i;
539 gcc_assert (num < stack_vars_num);
540 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
541 add_stack_var_conflict (num, i);
544 return false;
547 /* Helper routine for add_scope_conflicts, calculating the active partitions
548 at the end of BB, leaving the result in WORK. We're called to generate
549 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
550 liveness. */
552 static void
553 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
555 edge e;
556 edge_iterator ei;
557 gimple_stmt_iterator gsi;
558 walk_stmt_load_store_addr_fn visit;
560 bitmap_clear (work);
561 FOR_EACH_EDGE (e, ei, bb->preds)
562 bitmap_ior_into (work, (bitmap)e->src->aux);
564 visit = visit_op;
566 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
568 gimple *stmt = gsi_stmt (gsi);
569 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
571 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
573 gimple *stmt = gsi_stmt (gsi);
575 if (gimple_clobber_p (stmt))
577 tree lhs = gimple_assign_lhs (stmt);
578 size_t *v;
579 /* Nested function lowering might introduce LHSs
580 that are COMPONENT_REFs. */
581 if (!VAR_P (lhs))
582 continue;
583 if (DECL_RTL_IF_SET (lhs) == pc_rtx
584 && (v = decl_to_stack_part->get (lhs)))
585 bitmap_clear_bit (work, *v);
587 else if (!is_gimple_debug (stmt))
589 if (for_conflict
590 && visit == visit_op)
592 /* If this is the first real instruction in this BB we need
593 to add conflicts for everything live at this point now.
594 Unlike classical liveness for named objects we can't
595 rely on seeing a def/use of the names we're interested in.
596 There might merely be indirect loads/stores. We'd not add any
597 conflicts for such partitions. */
598 bitmap_iterator bi;
599 unsigned i;
600 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
602 struct stack_var *a = &stack_vars[i];
603 if (!a->conflicts)
604 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
605 bitmap_ior_into (a->conflicts, work);
607 visit = visit_conflict;
609 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
614 /* Generate stack partition conflicts between all partitions that are
615 simultaneously live. */
617 static void
618 add_scope_conflicts (void)
620 basic_block bb;
621 bool changed;
622 bitmap work = BITMAP_ALLOC (NULL);
623 int *rpo;
624 int n_bbs;
626 /* We approximate the live range of a stack variable by taking the first
627 mention of its name as starting point(s), and by the end-of-scope
628 death clobber added by gimplify as ending point(s) of the range.
629 This overapproximates in the case we for instance moved an address-taken
630 operation upward, without also moving a dereference to it upwards.
631 But it's conservatively correct as a variable never can hold values
632 before its name is mentioned at least once.
634 We then do a mostly classical bitmap liveness algorithm. */
636 FOR_ALL_BB_FN (bb, cfun)
637 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
639 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
640 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
642 changed = true;
643 while (changed)
645 int i;
646 changed = false;
647 for (i = 0; i < n_bbs; i++)
649 bitmap active;
650 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
651 active = (bitmap)bb->aux;
652 add_scope_conflicts_1 (bb, work, false);
653 if (bitmap_ior_into (active, work))
654 changed = true;
658 FOR_EACH_BB_FN (bb, cfun)
659 add_scope_conflicts_1 (bb, work, true);
661 free (rpo);
662 BITMAP_FREE (work);
663 FOR_ALL_BB_FN (bb, cfun)
664 BITMAP_FREE (bb->aux);
667 /* A subroutine of partition_stack_vars. A comparison function for qsort,
668 sorting an array of indices by the properties of the object. */
670 static int
671 stack_var_cmp (const void *a, const void *b)
673 size_t ia = *(const size_t *)a;
674 size_t ib = *(const size_t *)b;
675 unsigned int aligna = stack_vars[ia].alignb;
676 unsigned int alignb = stack_vars[ib].alignb;
677 poly_int64 sizea = stack_vars[ia].size;
678 poly_int64 sizeb = stack_vars[ib].size;
679 tree decla = stack_vars[ia].decl;
680 tree declb = stack_vars[ib].decl;
681 bool largea, largeb;
682 unsigned int uida, uidb;
684 /* Primary compare on "large" alignment. Large comes first. */
685 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
686 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
687 if (largea != largeb)
688 return (int)largeb - (int)largea;
690 /* Secondary compare on size, decreasing */
691 int diff = compare_sizes_for_sort (sizeb, sizea);
692 if (diff != 0)
693 return diff;
695 /* Tertiary compare on true alignment, decreasing. */
696 if (aligna < alignb)
697 return -1;
698 if (aligna > alignb)
699 return 1;
701 /* Final compare on ID for sort stability, increasing.
702 Two SSA names are compared by their version, SSA names come before
703 non-SSA names, and two normal decls are compared by their DECL_UID. */
704 if (TREE_CODE (decla) == SSA_NAME)
706 if (TREE_CODE (declb) == SSA_NAME)
707 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
708 else
709 return -1;
711 else if (TREE_CODE (declb) == SSA_NAME)
712 return 1;
713 else
714 uida = DECL_UID (decla), uidb = DECL_UID (declb);
715 if (uida < uidb)
716 return 1;
717 if (uida > uidb)
718 return -1;
719 return 0;
/* Hash map from an integer key to a bitmap.  In this file the key is a
   decl's DECL_PT_UID and the value is the bitmap holding the
   DECL_PT_UIDs of all members of the stack partition that decl belongs
   to.  */
722 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
723 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
725 /* If the points-to solution *PI points to variables that are in a partition
726 together with other variables add all partition members to the pointed-to
727 variables bitmap. */
729 static void
730 add_partitioned_vars_to_ptset (struct pt_solution *pt,
731 part_hashmap *decls_to_partitions,
732 hash_set<bitmap> *visited, bitmap temp)
734 bitmap_iterator bi;
735 unsigned i;
736 bitmap *part;
738 if (pt->anything
739 || pt->vars == NULL
740 /* The pointed-to vars bitmap is shared, it is enough to
741 visit it once. */
742 || visited->add (pt->vars))
743 return;
745 bitmap_clear (temp);
747 /* By using a temporary bitmap to store all members of the partitions
748 we have to add we make sure to visit each of the partitions only
749 once. */
750 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
751 if ((!temp
752 || !bitmap_bit_p (temp, i))
753 && (part = decls_to_partitions->get (i)))
754 bitmap_ior_into (temp, *part);
755 if (!bitmap_empty_p (temp))
756 bitmap_ior_into (pt->vars, temp);
759 /* Update points-to sets based on partition info, so we can use them on RTL.
760 The bitmaps representing stack partitions will be saved until expand,
761 where partitioned decls used as bases in memory expressions will be
762 rewritten. */
764 static void
765 update_alias_info_with_stack_vars (void)
767 part_hashmap *decls_to_partitions = NULL;
768 size_t i, j;
769 tree var = NULL_TREE;
771 for (i = 0; i < stack_vars_num; i++)
773 bitmap part = NULL;
774 tree name;
775 struct ptr_info_def *pi;
777 /* Not interested in partitions with single variable. */
778 if (stack_vars[i].representative != i
779 || stack_vars[i].next == EOC)
780 continue;
782 if (!decls_to_partitions)
784 decls_to_partitions = new part_hashmap;
785 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
788 /* Create an SSA_NAME that points to the partition for use
789 as base during alias-oracle queries on RTL for bases that
790 have been partitioned. */
791 if (var == NULL_TREE)
792 var = create_tmp_var (ptr_type_node);
793 name = make_ssa_name (var);
795 /* Create bitmaps representing partitions. They will be used for
796 points-to sets later, so use GGC alloc. */
797 part = BITMAP_GGC_ALLOC ();
798 for (j = i; j != EOC; j = stack_vars[j].next)
800 tree decl = stack_vars[j].decl;
801 unsigned int uid = DECL_PT_UID (decl);
802 bitmap_set_bit (part, uid);
803 decls_to_partitions->put (uid, part);
804 cfun->gimple_df->decls_to_pointers->put (decl, name);
805 if (TREE_ADDRESSABLE (decl))
806 TREE_ADDRESSABLE (name) = 1;
809 /* Make the SSA name point to all partition members. */
810 pi = get_ptr_info (name);
811 pt_solution_set (&pi->pt, part, false);
814 /* Make all points-to sets that contain one member of a partition
815 contain all members of the partition. */
816 if (decls_to_partitions)
818 unsigned i;
819 tree name;
820 hash_set<bitmap> visited;
821 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
823 FOR_EACH_SSA_NAME (i, name, cfun)
825 struct ptr_info_def *pi;
827 if (POINTER_TYPE_P (TREE_TYPE (name))
828 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
829 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
830 &visited, temp);
833 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
834 decls_to_partitions, &visited, temp);
836 delete decls_to_partitions;
837 BITMAP_FREE (temp);
841 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
842 partitioning algorithm. Partitions A and B are known to be non-conflicting.
843 Merge them into a single partition A. */
845 static void
846 union_stack_vars (size_t a, size_t b)
848 struct stack_var *vb = &stack_vars[b];
849 bitmap_iterator bi;
850 unsigned u;
852 gcc_assert (stack_vars[b].next == EOC);
853 /* Add B to A's partition. */
854 stack_vars[b].next = stack_vars[a].next;
855 stack_vars[b].representative = a;
856 stack_vars[a].next = b;
858 /* Update the required alignment of partition A to account for B. */
859 if (stack_vars[a].alignb < stack_vars[b].alignb)
860 stack_vars[a].alignb = stack_vars[b].alignb;
862 /* Update the interference graph and merge the conflicts. */
863 if (vb->conflicts)
865 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
866 add_stack_var_conflict (a, stack_vars[u].representative);
867 BITMAP_FREE (vb->conflicts);
871 /* A subroutine of expand_used_vars. Binpack the variables into
872 partitions constrained by the interference graph. The overall
873 algorithm used is as follows:
875 Sort the objects by size in descending order.
876 For each object A {
877 S = size(A)
878 O = 0
879 loop {
880 Look for the largest non-conflicting object B with size <= S.
881 UNION (A, B)
886 static void
887 partition_stack_vars (void)
889 size_t si, sj, n = stack_vars_num;
891 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
892 for (si = 0; si < n; ++si)
893 stack_vars_sorted[si] = si;
895 if (n == 1)
896 return;
898 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
900 for (si = 0; si < n; ++si)
902 size_t i = stack_vars_sorted[si];
903 unsigned int ialign = stack_vars[i].alignb;
904 poly_int64 isize = stack_vars[i].size;
906 /* Ignore objects that aren't partition representatives. If we
907 see a var that is not a partition representative, it must
908 have been merged earlier. */
909 if (stack_vars[i].representative != i)
910 continue;
912 for (sj = si + 1; sj < n; ++sj)
914 size_t j = stack_vars_sorted[sj];
915 unsigned int jalign = stack_vars[j].alignb;
916 poly_int64 jsize = stack_vars[j].size;
918 /* Ignore objects that aren't partition representatives. */
919 if (stack_vars[j].representative != j)
920 continue;
922 /* Do not mix objects of "small" (supported) alignment
923 and "large" (unsupported) alignment. */
924 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
925 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
926 break;
928 /* For Address Sanitizer do not mix objects with different
929 sizes, as the shorter vars wouldn't be adequately protected.
930 Don't do that for "large" (unsupported) alignment objects,
931 those aren't protected anyway. */
932 if (asan_sanitize_stack_p ()
933 && maybe_ne (isize, jsize)
934 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
935 break;
937 /* Ignore conflicting objects. */
938 if (stack_var_conflict_p (i, j))
939 continue;
941 /* UNION the objects, placing J at OFFSET. */
942 union_stack_vars (i, j);
946 update_alias_info_with_stack_vars ();
949 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
951 static void
952 dump_stack_var_partition (void)
954 size_t si, i, j, n = stack_vars_num;
956 for (si = 0; si < n; ++si)
958 i = stack_vars_sorted[si];
960 /* Skip variables that aren't partition representatives, for now. */
961 if (stack_vars[i].representative != i)
962 continue;
964 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
965 print_dec (stack_vars[i].size, dump_file);
966 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
968 for (j = i; j != EOC; j = stack_vars[j].next)
970 fputc ('\t', dump_file);
971 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
973 fputc ('\n', dump_file);
977 /* Assign rtl to DECL at BASE + OFFSET. */
979 static void
980 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
981 poly_int64 offset)
983 unsigned align;
984 rtx x;
986 /* If this fails, we've overflowed the stack frame. Error nicely? */
987 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
989 x = plus_constant (Pmode, base, offset);
990 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
991 ? TYPE_MODE (TREE_TYPE (decl))
992 : DECL_MODE (SSAVAR (decl)), x);
994 if (TREE_CODE (decl) != SSA_NAME)
996 /* Set alignment we actually gave this decl if it isn't an SSA name.
997 If it is we generate stack slots only accidentally so it isn't as
998 important, we'll simply use the alignment that is already set. */
999 if (base == virtual_stack_vars_rtx)
1000 offset -= frame_phase;
1001 align = known_alignment (offset);
1002 align *= BITS_PER_UNIT;
1003 if (align == 0 || align > base_align)
1004 align = base_align;
1006 /* One would think that we could assert that we're not decreasing
1007 alignment here, but (at least) the i386 port does exactly this
1008 via the MINIMUM_ALIGNMENT hook. */
1010 SET_DECL_ALIGN (decl, align);
1011 DECL_USER_ALIGN (decl) = 0;
1014 set_rtl (decl, x);
1017 struct stack_vars_data
1019 /* Vector of offset pairs, always end of some padding followed
1020 by start of the padding that needs Address Sanitizer protection.
1021 The vector is in reversed, highest offset pairs come first. */
1022 auto_vec<HOST_WIDE_INT> asan_vec;
1024 /* Vector of partition representative decls in between the paddings. */
1025 auto_vec<tree> asan_decl_vec;
1027 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1028 rtx asan_base;
1030 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1031 unsigned int asan_alignb;
1034 /* A subroutine of expand_used_vars. Give each partition representative
1035 a unique location within the stack frame. Update each partition member
1036 with that location.

PRED, when non-NULL, is called with a stack_vars index and selects
which partition representatives are laid out by this call; variables
whose alignment exceeds MAX_SUPPORTED_STACK_ALIGNMENT are only handled
when PRED is NULL. DATA receives the Address Sanitizer bookkeeping
(offset pairs, representative decls, base register and alignment) for
variables laid out while stack sanitization is active and PRED is
non-NULL. */
1038 static void
1039 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1041 size_t si, i, j, n = stack_vars_num;
1042 poly_uint64 large_size = 0, large_alloc = 0;
1043 rtx large_base = NULL;
1044 unsigned large_align = 0;
1045 bool large_allocation_done = false;
1046 tree decl;
1048 /* Determine if there are any variables requiring "large" alignment.
1049 Since these are dynamically allocated, we only process these if
1050 no predicate involved. */
/* NOTE(review): this reads stack_vars_sorted[0] unconditionally, so it
relies on the caller only invoking us when stack_vars_num > 0. */
1051 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1052 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1054 /* Find the total size of these variables. */
1055 for (si = 0; si < n; ++si)
1057 unsigned alignb;
1059 i = stack_vars_sorted[si];
1060 alignb = stack_vars[i].alignb;
1062 /* All "large" alignment decls come before all "small" alignment
1063 decls, but "large" alignment decls are not sorted based on
1064 their alignment. Increase large_align to track the largest
1065 required alignment. */
1066 if ((alignb * BITS_PER_UNIT) > large_align)
1067 large_align = alignb * BITS_PER_UNIT;
1069 /* Stop when we get to the first decl with "small" alignment. */
1070 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1071 break;
1073 /* Skip variables that aren't partition representatives. */
1074 if (stack_vars[i].representative != i)
1075 continue;
1077 /* Skip variables that have already had rtl assigned. See also
1078 add_stack_var where we perpetrate this pc_rtx hack. */
1079 decl = stack_vars[i].decl;
1080 if (TREE_CODE (decl) == SSA_NAME
1081 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1082 : DECL_RTL (decl) != pc_rtx)
1083 continue;
/* Accumulate the aligned size; the main loop below mirrors this
computation in large_alloc and the final assert compares the two. */
1085 large_size = aligned_upper_bound (large_size, alignb);
1086 large_size += stack_vars[i].size;
/* Main pass: pick a base and an offset for every partition
representative that is eligible in this call. */
1090 for (si = 0; si < n; ++si)
1092 rtx base;
1093 unsigned base_align, alignb;
1094 poly_int64 offset;
1096 i = stack_vars_sorted[si];
1098 /* Skip variables that aren't partition representatives, for now. */
1099 if (stack_vars[i].representative != i)
1100 continue;
1102 /* Skip variables that have already had rtl assigned. See also
1103 add_stack_var where we perpetrate this pc_rtx hack. */
1104 decl = stack_vars[i].decl;
1105 if (TREE_CODE (decl) == SSA_NAME
1106 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1107 : DECL_RTL (decl) != pc_rtx)
1108 continue;
1110 /* Check the predicate to see whether this variable should be
1111 allocated in this pass. */
1112 if (pred && !pred (i))
1113 continue;
1115 alignb = stack_vars[i].alignb;
1116 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1118 base = virtual_stack_vars_rtx;
1119 /* ASAN description strings don't yet have a syntax for expressing
1120 polynomial offsets. */
1121 HOST_WIDE_INT prev_offset;
1122 if (asan_sanitize_stack_p ()
1123 && pred
1124 && frame_offset.is_constant (&prev_offset)
1125 && stack_vars[i].size.is_constant ())
/* Sanitized layout: the variable is allocated together with
ASAN_RED_ZONE_SIZE extra bytes, aligned to at least the red zone
size, and addressed relative to data->asan_base. */
1127 prev_offset = align_base (prev_offset,
1128 MAX (alignb, ASAN_RED_ZONE_SIZE),
1129 !FRAME_GROWS_DOWNWARD);
1130 tree repr_decl = NULL_TREE;
1131 offset
1132 = alloc_stack_frame_space (stack_vars[i].size
1133 + ASAN_RED_ZONE_SIZE,
1134 MAX (alignb, ASAN_RED_ZONE_SIZE));
/* Two entries are pushed per variable: the aligned frame offset
before the allocation, then the offset just past the variable. */
1136 data->asan_vec.safe_push (prev_offset);
1137 /* Allocating a constant amount of space from a constant
1138 starting offset must give a constant result. */
1139 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1140 .to_constant ());
1141 /* Find best representative of the partition.
1142 Prefer those with DECL_NAME, even better
1143 satisfying asan_protect_stack_decl predicate. */
1144 for (j = i; j != EOC; j = stack_vars[j].next)
1145 if (asan_protect_stack_decl (stack_vars[j].decl)
1146 && DECL_NAME (stack_vars[j].decl))
1148 repr_decl = stack_vars[j].decl;
1149 break;
1151 else if (repr_decl == NULL_TREE
1152 && DECL_P (stack_vars[j].decl)
1153 && DECL_NAME (stack_vars[j].decl))
1154 repr_decl = stack_vars[j].decl;
/* Fall back to the partition representative itself when no member
of the partition has a name. */
1155 if (repr_decl == NULL_TREE)
1156 repr_decl = stack_vars[i].decl;
1157 data->asan_decl_vec.safe_push (repr_decl);
1159 /* Make sure a representative is unpoisoned if another
1160 variable in the partition is handled by
1161 use-after-scope sanitization. */
1162 if (asan_handled_variables != NULL
1163 && !asan_handled_variables->contains (repr_decl))
1165 for (j = i; j != EOC; j = stack_vars[j].next)
1166 if (asan_handled_variables->contains (stack_vars[j].decl))
1167 break;
1168 if (j != EOC)
1169 asan_handled_variables->add (repr_decl);
1172 data->asan_alignb = MAX (data->asan_alignb, alignb);
/* The ASAN base pseudo is created lazily, on the first sanitized
variable. */
1173 if (data->asan_base == NULL)
1174 data->asan_base = gen_reg_rtx (Pmode);
1175 base = data->asan_base;
1177 if (!STRICT_ALIGNMENT)
1178 base_align = crtl->max_used_stack_slot_alignment;
1179 else
1180 base_align = MAX (crtl->max_used_stack_slot_alignment,
1181 GET_MODE_ALIGNMENT (SImode)
1182 << ASAN_SHADOW_SHIFT);
1184 else
/* Plain layout: allocate directly from the frame, no red zone. */
1186 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1187 base_align = crtl->max_used_stack_slot_alignment;
1190 else
1192 /* Large alignment is only processed in the last pass. */
1193 if (pred)
1194 continue;
1196 /* If there were any variables requiring "large" alignment, allocate
1197 space. */
1198 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1200 poly_int64 loffset;
1201 rtx large_allocsize;
1203 large_allocsize = gen_int_mode (large_size, Pmode);
1204 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1205 loffset = alloc_stack_frame_space
1206 (rtx_to_poly_int64 (large_allocsize),
1207 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1208 large_base = get_dynamic_stack_base (loffset, large_align);
1209 large_allocation_done = true;
1211 gcc_assert (large_base != NULL);
/* Place this variable at the next suitably aligned offset inside
the block addressed by large_base. */
1213 large_alloc = aligned_upper_bound (large_alloc, alignb);
1214 offset = large_alloc;
1215 large_alloc += stack_vars[i].size;
1217 base = large_base;
1218 base_align = large_align;
1221 /* Create rtl for each variable based on their location within the
1222 partition. */
1223 for (j = i; j != EOC; j = stack_vars[j].next)
1225 expand_one_stack_var_at (stack_vars[j].decl,
1226 base, base_align,
1227 offset);
/* Everything counted by the sizing loop must have been placed by the
main loop (both stay zero when no large-alignment work was done). */
1231 gcc_assert (known_eq (large_alloc, large_size));
1234 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1235 static poly_uint64
1236 account_stack_vars (void)
1238 size_t si, j, i, n = stack_vars_num;
1239 poly_uint64 size = 0;
1241 for (si = 0; si < n; ++si)
1243 i = stack_vars_sorted[si];
1245 /* Skip variables that aren't partition representatives, for now. */
1246 if (stack_vars[i].representative != i)
1247 continue;
1249 size += stack_vars[i].size;
1250 for (j = i; j != EOC; j = stack_vars[j].next)
1251 set_rtl (stack_vars[j].decl, NULL);
1253 return size;
1256 /* Record the RTL assignment X for the default def of PARM. */
1258 extern void
1259 set_parm_rtl (tree parm, rtx x)
1261 gcc_assert (TREE_CODE (parm) == PARM_DECL
1262 || TREE_CODE (parm) == RESULT_DECL);
1264 if (x && !MEM_P (x))
1266 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1267 TYPE_MODE (TREE_TYPE (parm)),
1268 TYPE_ALIGN (TREE_TYPE (parm)));
1270 /* If the variable alignment is very large we'll dynamicaly
1271 allocate it, which means that in-frame portion is just a
1272 pointer. ??? We've got a pseudo for sure here, do we
1273 actually dynamically allocate its spilling area if needed?
1274 ??? Isn't it a problem when Pmode alignment also exceeds
1275 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1276 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1277 align = GET_MODE_ALIGNMENT (Pmode);
1279 record_alignment_for_reg_var (align);
1282 tree ssa = ssa_default_def (cfun, parm);
1283 if (!ssa)
1284 return set_rtl (parm, x);
1286 int part = var_to_partition (SA.map, ssa);
1287 gcc_assert (part != NO_PARTITION);
1289 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1290 gcc_assert (changed);
1292 set_rtl (ssa, x);
1293 gcc_assert (DECL_RTL (parm) == x);
1296 /* A subroutine of expand_one_var. Called to immediately assign rtl
1297 to a variable to be allocated in the stack frame. */
1299 static void
1300 expand_one_stack_var_1 (tree var)
1302 poly_uint64 size;
1303 poly_int64 offset;
1304 unsigned byte_align;
1306 if (TREE_CODE (var) == SSA_NAME)
1308 tree type = TREE_TYPE (var);
1309 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1310 byte_align = TYPE_ALIGN_UNIT (type);
1312 else
1314 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1315 byte_align = align_local_variable (var);
1318 /* We handle highly aligned variables in expand_stack_vars. */
1319 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1321 offset = alloc_stack_frame_space (size, byte_align);
1323 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1324 crtl->max_used_stack_slot_alignment, offset);
1327 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1328 already assigned some MEM. */
1330 static void
1331 expand_one_stack_var (tree var)
1333 if (TREE_CODE (var) == SSA_NAME)
1335 int part = var_to_partition (SA.map, var);
1336 if (part != NO_PARTITION)
1338 rtx x = SA.partition_to_pseudo[part];
1339 gcc_assert (x);
1340 gcc_assert (MEM_P (x));
1341 return;
1345 return expand_one_stack_var_1 (var);
1348 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1349 that will reside in a hard register. */
1351 static void
1352 expand_one_hard_reg_var (tree var)
1354 rest_of_decl_compilation (var, 0, 0);
1357 /* Record the alignment requirements of some variable assigned to a
1358 pseudo. */
1360 static void
1361 record_alignment_for_reg_var (unsigned int align)
1363 if (SUPPORTS_STACK_ALIGNMENT
1364 && crtl->stack_alignment_estimated < align)
1366 /* stack_alignment_estimated shouldn't change after stack
1367 realign decision made */
1368 gcc_assert (!crtl->stack_realign_processed);
1369 crtl->stack_alignment_estimated = align;
1372 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1373 So here we only make sure stack_alignment_needed >= align. */
1374 if (crtl->stack_alignment_needed < align)
1375 crtl->stack_alignment_needed = align;
1376 if (crtl->max_used_stack_slot_alignment < align)
1377 crtl->max_used_stack_slot_alignment = align;
1380 /* Create RTL for an SSA partition. */
1382 static void
1383 expand_one_ssa_partition (tree var)
1385 int part = var_to_partition (SA.map, var);
1386 gcc_assert (part != NO_PARTITION);
1388 if (SA.partition_to_pseudo[part])
1389 return;
1391 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1392 TYPE_MODE (TREE_TYPE (var)),
1393 TYPE_ALIGN (TREE_TYPE (var)));
1395 /* If the variable alignment is very large we'll dynamicaly allocate
1396 it, which means that in-frame portion is just a pointer. */
1397 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1398 align = GET_MODE_ALIGNMENT (Pmode);
1400 record_alignment_for_reg_var (align);
1402 if (!use_register_for_decl (var))
1404 if (defer_stack_allocation (var, true))
1405 add_stack_var (var);
1406 else
1407 expand_one_stack_var_1 (var);
1408 return;
1411 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1412 rtx x = gen_reg_rtx (reg_mode);
1414 set_rtl (var, x);
1416 /* For a promoted variable, X will not be used directly but wrapped in a
1417 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1418 will assume that its upper bits can be inferred from its lower bits.
1419 Therefore, if X isn't initialized on every path from the entry, then
1420 we must do it manually in order to fulfill the above assumption. */
1421 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1422 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1423 emit_move_insn (x, CONST0_RTX (reg_mode));
1426 /* Record the association between the RTL generated for partition PART
1427 and the underlying variable of the SSA_NAME VAR. */
1429 static void
1430 adjust_one_expanded_partition_var (tree var)
1432 if (!var)
1433 return;
1435 tree decl = SSA_NAME_VAR (var);
1437 int part = var_to_partition (SA.map, var);
1438 if (part == NO_PARTITION)
1439 return;
1441 rtx x = SA.partition_to_pseudo[part];
1443 gcc_assert (x);
1445 set_rtl (var, x);
1447 if (!REG_P (x))
1448 return;
1450 /* Note if the object is a user variable. */
1451 if (decl && !DECL_ARTIFICIAL (decl))
1452 mark_user_reg (x);
1454 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1455 mark_reg_pointer (x, get_pointer_alignment (var));
1458 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1459 that will reside in a pseudo register. */
1461 static void
1462 expand_one_register_var (tree var)
1464 if (TREE_CODE (var) == SSA_NAME)
1466 int part = var_to_partition (SA.map, var);
1467 if (part != NO_PARTITION)
1469 rtx x = SA.partition_to_pseudo[part];
1470 gcc_assert (x);
1471 gcc_assert (REG_P (x));
1472 return;
1474 gcc_unreachable ();
1477 tree decl = var;
1478 tree type = TREE_TYPE (decl);
1479 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1480 rtx x = gen_reg_rtx (reg_mode);
1482 set_rtl (var, x);
1484 /* Note if the object is a user variable. */
1485 if (!DECL_ARTIFICIAL (decl))
1486 mark_user_reg (x);
1488 if (POINTER_TYPE_P (type))
1489 mark_reg_pointer (x, get_pointer_alignment (var));
1492 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1493 has some associated error, e.g. its type is error-mark. We just need
1494 to pick something that won't crash the rest of the compiler. */
1496 static void
1497 expand_one_error_var (tree var)
1499 machine_mode mode = DECL_MODE (var);
1500 rtx x;
1502 if (mode == BLKmode)
1503 x = gen_rtx_MEM (BLKmode, const0_rtx);
1504 else if (mode == VOIDmode)
1505 x = const0_rtx;
1506 else
1507 x = gen_reg_rtx (mode);
1509 SET_DECL_RTL (var, x);
1512 /* A subroutine of expand_one_var. VAR is a variable that will be
1513 allocated to the local stack frame. Return true if we wish to
1514 add VAR to STACK_VARS so that it will be coalesced with other
1515 variables. Return false to allocate VAR immediately.
1517 This function is used to reduce the number of variables considered
1518 for coalescing, which reduces the size of the quadratic problem. */
1520 static bool
1521 defer_stack_allocation (tree var, bool toplevel)
1523 tree size_unit = TREE_CODE (var) == SSA_NAME
1524 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1525 : DECL_SIZE_UNIT (var);
1526 poly_uint64 size;
1528 /* Whether the variable is small enough for immediate allocation not to be
1529 a problem with regard to the frame size. */
1530 bool smallish
1531 = (poly_int_tree_p (size_unit, &size)
1532 && (estimated_poly_value (size)
1533 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING)));
1535 /* If stack protection is enabled, *all* stack variables must be deferred,
1536 so that we can re-order the strings to the top of the frame.
1537 Similarly for Address Sanitizer. */
1538 if (flag_stack_protect || asan_sanitize_stack_p ())
1539 return true;
1541 unsigned int align = TREE_CODE (var) == SSA_NAME
1542 ? TYPE_ALIGN (TREE_TYPE (var))
1543 : DECL_ALIGN (var);
1545 /* We handle "large" alignment via dynamic allocation. We want to handle
1546 this extra complication in only one place, so defer them. */
1547 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1548 return true;
1550 bool ignored = TREE_CODE (var) == SSA_NAME
1551 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1552 : DECL_IGNORED_P (var);
1554 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1555 might be detached from their block and appear at toplevel when we reach
1556 here. We want to coalesce them with variables from other blocks when
1557 the immediate contribution to the frame size would be noticeable. */
1558 if (toplevel && optimize > 0 && ignored && !smallish)
1559 return true;
1561 /* Variables declared in the outermost scope automatically conflict
1562 with every other variable. The only reason to want to defer them
1563 at all is that, after sorting, we can more efficiently pack
1564 small variables in the stack frame. Continue to defer at -O2. */
1565 if (toplevel && optimize < 2)
1566 return false;
1568 /* Without optimization, *most* variables are allocated from the
1569 stack, which makes the quadratic problem large exactly when we
1570 want compilation to proceed as quickly as possible. On the
1571 other hand, we don't want the function's stack frame size to
1572 get completely out of hand. So we avoid adding scalars and
1573 "small" aggregates to the list at all. */
1574 if (optimize == 0 && smallish)
1575 return false;
1577 return true;
1580 /* A subroutine of expand_used_vars. Expand one variable according to
1581 its flavor. Variables to be placed on the stack are not actually
1582 expanded yet, merely recorded.
1583 When REALLY_EXPAND is false, only add stack values to be allocated.
1584 Return stack usage this variable is supposed to take.
1587 static poly_uint64
1588 expand_one_var (tree var, bool toplevel, bool really_expand)
1590 unsigned int align = BITS_PER_UNIT;
1591 tree origvar = var;
1593 var = SSAVAR (var);
1595 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1597 if (is_global_var (var))
1598 return 0;
1600 /* Because we don't know if VAR will be in register or on stack,
1601 we conservatively assume it will be on stack even if VAR is
1602 eventually put into register after RA pass. For non-automatic
1603 variables, which won't be on stack, we collect alignment of
1604 type and ignore user specified alignment. Similarly for
1605 SSA_NAMEs for which use_register_for_decl returns true. */
1606 if (TREE_STATIC (var)
1607 || DECL_EXTERNAL (var)
1608 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1609 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1610 TYPE_MODE (TREE_TYPE (var)),
1611 TYPE_ALIGN (TREE_TYPE (var)));
1612 else if (DECL_HAS_VALUE_EXPR_P (var)
1613 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1614 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1615 or variables which were assigned a stack slot already by
1616 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1617 changed from the offset chosen to it. */
1618 align = crtl->stack_alignment_estimated;
1619 else
1620 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1622 /* If the variable alignment is very large we'll dynamicaly allocate
1623 it, which means that in-frame portion is just a pointer. */
1624 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1625 align = GET_MODE_ALIGNMENT (Pmode);
1628 record_alignment_for_reg_var (align);
1630 poly_uint64 size;
1631 if (TREE_CODE (origvar) == SSA_NAME)
1633 gcc_assert (!VAR_P (var)
1634 || (!DECL_EXTERNAL (var)
1635 && !DECL_HAS_VALUE_EXPR_P (var)
1636 && !TREE_STATIC (var)
1637 && TREE_TYPE (var) != error_mark_node
1638 && !DECL_HARD_REGISTER (var)
1639 && really_expand));
1641 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1643 else if (DECL_EXTERNAL (var))
1645 else if (DECL_HAS_VALUE_EXPR_P (var))
1647 else if (TREE_STATIC (var))
1649 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1651 else if (TREE_TYPE (var) == error_mark_node)
1653 if (really_expand)
1654 expand_one_error_var (var);
1656 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1658 if (really_expand)
1660 expand_one_hard_reg_var (var);
1661 if (!DECL_HARD_REGISTER (var))
1662 /* Invalid register specification. */
1663 expand_one_error_var (var);
1666 else if (use_register_for_decl (var))
1668 if (really_expand)
1669 expand_one_register_var (origvar);
1671 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1672 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1674 /* Reject variables which cover more than half of the address-space. */
1675 if (really_expand)
1677 if (DECL_NONLOCAL_FRAME (var))
1678 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1679 "total size of local objects is too large");
1680 else
1681 error_at (DECL_SOURCE_LOCATION (var),
1682 "size of variable %q+D is too large", var);
1683 expand_one_error_var (var);
1686 else if (defer_stack_allocation (var, toplevel))
1687 add_stack_var (origvar);
1688 else
1690 if (really_expand)
1692 if (lookup_attribute ("naked",
1693 DECL_ATTRIBUTES (current_function_decl)))
1694 error ("cannot allocate stack for variable %q+D, naked function.",
1695 var);
1697 expand_one_stack_var (origvar);
1699 return size;
1701 return 0;
1704 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1705 expanding variables. Those variables that can be put into registers
1706 are allocated pseudos; those that can't are put on the stack.
1708 TOPLEVEL is true if this is the outermost BLOCK. */
1710 static void
1711 expand_used_vars_for_block (tree block, bool toplevel)
1713 tree t;
1715 /* Expand all variables at this level. */
1716 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1717 if (TREE_USED (t)
1718 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1719 || !DECL_NONSHAREABLE (t)))
1720 expand_one_var (t, toplevel, true);
1722 /* Expand all variables at containing levels. */
1723 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1724 expand_used_vars_for_block (t, false);
1727 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1728 and clear TREE_USED on all local variables. */
1730 static void
1731 clear_tree_used (tree block)
1733 tree t;
1735 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1736 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1737 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1738 || !DECL_NONSHAREABLE (t))
1739 TREE_USED (t) = 0;
1741 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1742 clear_tree_used (t);
/* Values that flag_stack_protect is compared against in this file.  */
enum {
  /* Guard functions that call alloca, have protected decls, or carry
     the "stack_protect" attribute.  */
  SPCT_FLAG_DEFAULT = 1,

  /* Guard every function.  */
  SPCT_FLAG_ALL = 2,

  /* As SPCT_FLAG_DEFAULT, plus functions for which the stack protect
     signal was generated.  */
  SPCT_FLAG_STRONG = 3,

  /* Guard only functions carrying the "stack_protect" attribute.  */
  SPCT_FLAG_EXPLICIT = 4
};
1752 /* Examine TYPE and determine a bit mask of the following features. */
1754 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1755 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1756 #define SPCT_HAS_ARRAY 4
1757 #define SPCT_HAS_AGGREGATE 8
1759 static unsigned int
1760 stack_protect_classify_type (tree type)
1762 unsigned int ret = 0;
1763 tree t;
1765 switch (TREE_CODE (type))
1767 case ARRAY_TYPE:
1768 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1769 if (t == char_type_node
1770 || t == signed_char_type_node
1771 || t == unsigned_char_type_node)
1773 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1774 unsigned HOST_WIDE_INT len;
1776 if (!TYPE_SIZE_UNIT (type)
1777 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1778 len = max;
1779 else
1780 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1782 if (len < max)
1783 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1784 else
1785 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1787 else
1788 ret = SPCT_HAS_ARRAY;
1789 break;
1791 case UNION_TYPE:
1792 case QUAL_UNION_TYPE:
1793 case RECORD_TYPE:
1794 ret = SPCT_HAS_AGGREGATE;
1795 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1796 if (TREE_CODE (t) == FIELD_DECL)
1797 ret |= stack_protect_classify_type (TREE_TYPE (t));
1798 break;
1800 default:
1801 break;
1804 return ret;
1807 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1808 part of the local stack frame. Remember if we ever return nonzero for
1809 any variable in this function. The return value is the phase number in
1810 which the variable should be allocated. */
1812 static int
1813 stack_protect_decl_phase (tree decl)
1815 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1816 int ret = 0;
1818 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1819 has_short_buffer = true;
1821 if (flag_stack_protect == SPCT_FLAG_ALL
1822 || flag_stack_protect == SPCT_FLAG_STRONG
1823 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1824 && lookup_attribute ("stack_protect",
1825 DECL_ATTRIBUTES (current_function_decl))))
1827 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1828 && !(bits & SPCT_HAS_AGGREGATE))
1829 ret = 1;
1830 else if (bits & SPCT_HAS_ARRAY)
1831 ret = 2;
1833 else
1834 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1836 if (ret)
1837 has_protected_decls = true;
1839 return ret;
1842 /* Two helper routines that check for phase 1 and phase 2. These are used
1843 as callbacks for expand_stack_vars. */
1845 static bool
1846 stack_protect_decl_phase_1 (size_t i)
1848 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1851 static bool
1852 stack_protect_decl_phase_2 (size_t i)
1854 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1857 /* And helper function that checks for asan phase (with stack protector
1858 it is phase 3). This is used as callback for expand_stack_vars.
1859 Returns true if any of the vars in the partition need to be protected. */
1861 static bool
1862 asan_decl_phase_3 (size_t i)
1864 while (i != EOC)
1866 if (asan_protect_stack_decl (stack_vars[i].decl))
1867 return true;
1868 i = stack_vars[i].next;
1870 return false;
1873 /* Ensure that variables in different stack protection phases conflict
1874 so that they are not merged and share the same stack slot. */
1876 static void
1877 add_stack_protection_conflicts (void)
1879 size_t i, j, n = stack_vars_num;
1880 unsigned char *phase;
1882 phase = XNEWVEC (unsigned char, n);
1883 for (i = 0; i < n; ++i)
1884 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1886 for (i = 0; i < n; ++i)
1888 unsigned char ph_i = phase[i];
1889 for (j = i + 1; j < n; ++j)
1890 if (ph_i != phase[j])
1891 add_stack_var_conflict (i, j);
1894 XDELETEVEC (phase);
1897 /* Create a decl for the guard at the top of the stack frame. */
1899 static void
1900 create_stack_guard (void)
1902 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1903 VAR_DECL, NULL, ptr_type_node);
1904 TREE_THIS_VOLATILE (guard) = 1;
1905 TREE_USED (guard) = 1;
1906 expand_one_stack_var (guard);
1907 crtl->stack_protect_guard = guard;
1910 /* Prepare for expanding variables. */
1911 static void
1912 init_vars_expansion (void)
1914 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1915 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1917 /* A map from decl to stack partition. */
1918 decl_to_stack_part = new hash_map<tree, size_t>;
1920 /* Initialize local stack smashing state. */
1921 has_protected_decls = false;
1922 has_short_buffer = false;
1925 /* Free up stack variable graph data. */
1926 static void
1927 fini_vars_expansion (void)
1929 bitmap_obstack_release (&stack_var_bitmap_obstack);
1930 if (stack_vars)
1931 XDELETEVEC (stack_vars);
1932 if (stack_vars_sorted)
1933 XDELETEVEC (stack_vars_sorted);
1934 stack_vars = NULL;
1935 stack_vars_sorted = NULL;
1936 stack_vars_alloc = stack_vars_num = 0;
1937 delete decl_to_stack_part;
1938 decl_to_stack_part = NULL;
1941 /* Make a fair guess for the size of the stack frame of the function
1942 in NODE. This doesn't have to be exact, the result is only used in
1943 the inline heuristics. So we don't want to run the full stack var
1944 packing algorithm (which is quadratic in the number of stack vars).
1945 Instead, we calculate the total size of all stack vars. This turns
1946 out to be a pretty fair estimate -- packing of stack vars doesn't
1947 happen very often. */
1949 HOST_WIDE_INT
1950 estimated_stack_frame_size (struct cgraph_node *node)
1952 poly_int64 size = 0;
1953 size_t i;
1954 tree var;
1955 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1957 push_cfun (fn);
1959 init_vars_expansion ();
1961 FOR_EACH_LOCAL_DECL (fn, i, var)
1962 if (auto_var_in_fn_p (var, fn->decl))
1963 size += expand_one_var (var, true, false);
1965 if (stack_vars_num > 0)
1967 /* Fake sorting the stack vars for account_stack_vars (). */
1968 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1969 for (i = 0; i < stack_vars_num; ++i)
1970 stack_vars_sorted[i] = i;
1971 size += account_stack_vars ();
1974 fini_vars_expansion ();
1975 pop_cfun ();
1976 return estimated_poly_value (size);
1979 /* Helper routine to check if a record or union contains an array field. */
1981 static int
1982 record_or_union_type_has_array_p (const_tree tree_type)
1984 tree fields = TYPE_FIELDS (tree_type);
1985 tree f;
1987 for (f = fields; f; f = DECL_CHAIN (f))
1988 if (TREE_CODE (f) == FIELD_DECL)
1990 tree field_type = TREE_TYPE (f);
1991 if (RECORD_OR_UNION_TYPE_P (field_type)
1992 && record_or_union_type_has_array_p (field_type))
1993 return 1;
1994 if (TREE_CODE (field_type) == ARRAY_TYPE)
1995 return 1;
1997 return 0;
2000 /* Check if the current function has local referenced variables that
2001 have their addresses taken, contain an array, or are arrays. */
2003 static bool
2004 stack_protect_decl_p ()
2006 unsigned i;
2007 tree var;
2009 FOR_EACH_LOCAL_DECL (cfun, i, var)
2010 if (!is_global_var (var))
2012 tree var_type = TREE_TYPE (var);
2013 if (VAR_P (var)
2014 && (TREE_CODE (var_type) == ARRAY_TYPE
2015 || TREE_ADDRESSABLE (var)
2016 || (RECORD_OR_UNION_TYPE_P (var_type)
2017 && record_or_union_type_has_array_p (var_type))))
2018 return true;
2020 return false;
2023 /* Check if the current function has calls that use a return slot. */
2025 static bool
2026 stack_protect_return_slot_p ()
2028 basic_block bb;
2030 FOR_ALL_BB_FN (bb, cfun)
2031 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2032 !gsi_end_p (gsi); gsi_next (&gsi))
2034 gimple *stmt = gsi_stmt (gsi);
2035 /* This assumes that calls to internal-only functions never
2036 use a return slot. */
2037 if (is_gimple_call (stmt)
2038 && !gimple_call_internal_p (stmt)
2039 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2040 gimple_call_fndecl (stmt)))
2041 return true;
2043 return false;
2046 /* Expand all variables used in the function. */
2048 static rtx_insn *
2049 expand_used_vars (void)
2051 tree var, outer_block = DECL_INITIAL (current_function_decl);
2052 auto_vec<tree> maybe_local_decls;
2053 rtx_insn *var_end_seq = NULL;
2054 unsigned i;
2055 unsigned len;
2056 bool gen_stack_protect_signal = false;
2058 /* Compute the phase of the stack frame for this function. */
2060 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2061 int off = targetm.starting_frame_offset () % align;
2062 frame_phase = off ? align - off : 0;
2065 /* Set TREE_USED on all variables in the local_decls. */
2066 FOR_EACH_LOCAL_DECL (cfun, i, var)
2067 TREE_USED (var) = 1;
2068 /* Clear TREE_USED on all variables associated with a block scope. */
2069 clear_tree_used (DECL_INITIAL (current_function_decl));
2071 init_vars_expansion ();
2073 if (targetm.use_pseudo_pic_reg ())
2074 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2076 for (i = 0; i < SA.map->num_partitions; i++)
2078 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2079 continue;
2081 tree var = partition_to_var (SA.map, i);
2083 gcc_assert (!virtual_operand_p (var));
2085 expand_one_ssa_partition (var);
2088 if (flag_stack_protect == SPCT_FLAG_STRONG)
2089 gen_stack_protect_signal
2090 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2092 /* At this point all variables on the local_decls with TREE_USED
2093 set are not associated with any block scope. Lay them out. */
2095 len = vec_safe_length (cfun->local_decls);
2096 FOR_EACH_LOCAL_DECL (cfun, i, var)
2098 bool expand_now = false;
2100 /* Expanded above already. */
2101 if (is_gimple_reg (var))
2103 TREE_USED (var) = 0;
2104 goto next;
2106 /* We didn't set a block for static or extern because it's hard
2107 to tell the difference between a global variable (re)declared
2108 in a local scope, and one that's really declared there to
2109 begin with. And it doesn't really matter much, since we're
2110 not giving them stack space. Expand them now. */
2111 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2112 expand_now = true;
2114 /* Expand variables not associated with any block now. Those created by
2115 the optimizers could be live anywhere in the function. Those that
2116 could possibly have been scoped originally and detached from their
2117 block will have their allocation deferred so we coalesce them with
2118 others when optimization is enabled. */
2119 else if (TREE_USED (var))
2120 expand_now = true;
2122 /* Finally, mark all variables on the list as used. We'll use
2123 this in a moment when we expand those associated with scopes. */
2124 TREE_USED (var) = 1;
2126 if (expand_now)
2127 expand_one_var (var, true, true);
2129 next:
2130 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2132 rtx rtl = DECL_RTL_IF_SET (var);
2134 /* Keep artificial non-ignored vars in cfun->local_decls
2135 chain until instantiate_decls. */
2136 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2137 add_local_decl (cfun, var);
2138 else if (rtl == NULL_RTX)
2139 /* If rtl isn't set yet, which can happen e.g. with
2140 -fstack-protector, retry before returning from this
2141 function. */
2142 maybe_local_decls.safe_push (var);
2146 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2148 +-----------------+-----------------+
2149 | ...processed... | ...duplicates...|
2150 +-----------------+-----------------+
2152 +-- LEN points here.
2154 We just want the duplicates, as those are the artificial
2155 non-ignored vars that we want to keep until instantiate_decls.
2156 Move them down and truncate the array. */
2157 if (!vec_safe_is_empty (cfun->local_decls))
2158 cfun->local_decls->block_remove (0, len);
2160 /* At this point, all variables within the block tree with TREE_USED
2161 set are actually used by the optimized function. Lay them out. */
2162 expand_used_vars_for_block (outer_block, true);
2164 if (stack_vars_num > 0)
2166 add_scope_conflicts ();
2168 /* If stack protection is enabled, we don't share space between
2169 vulnerable data and non-vulnerable data. */
2170 if (flag_stack_protect != 0
2171 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2172 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2173 && lookup_attribute ("stack_protect",
2174 DECL_ATTRIBUTES (current_function_decl)))))
2175 add_stack_protection_conflicts ();
2177 /* Now that we have collected all stack variables, and have computed a
2178 minimal interference graph, attempt to save some stack space. */
2179 partition_stack_vars ();
2180 if (dump_file)
2181 dump_stack_var_partition ();
2184 switch (flag_stack_protect)
2186 case SPCT_FLAG_ALL:
2187 create_stack_guard ();
2188 break;
2190 case SPCT_FLAG_STRONG:
2191 if (gen_stack_protect_signal
2192 || cfun->calls_alloca || has_protected_decls
2193 || lookup_attribute ("stack_protect",
2194 DECL_ATTRIBUTES (current_function_decl)))
2195 create_stack_guard ();
2196 break;
2198 case SPCT_FLAG_DEFAULT:
2199 if (cfun->calls_alloca || has_protected_decls
2200 || lookup_attribute ("stack_protect",
2201 DECL_ATTRIBUTES (current_function_decl)))
2202 create_stack_guard ();
2203 break;
2205 case SPCT_FLAG_EXPLICIT:
2206 if (lookup_attribute ("stack_protect",
2207 DECL_ATTRIBUTES (current_function_decl)))
2208 create_stack_guard ();
2209 break;
2210 default:
2214 /* Assign rtl to each variable based on these partitions. */
2215 if (stack_vars_num > 0)
2217 struct stack_vars_data data;
2219 data.asan_base = NULL_RTX;
2220 data.asan_alignb = 0;
2222 /* Reorder decls to be protected by iterating over the variables
2223 array multiple times, and allocating out of each phase in turn. */
2224 /* ??? We could probably integrate this into the qsort we did
2225 earlier, such that we naturally see these variables first,
2226 and thus naturally allocate things in the right order. */
2227 if (has_protected_decls)
2229 /* Phase 1 contains only character arrays. */
2230 expand_stack_vars (stack_protect_decl_phase_1, &data);
2232 /* Phase 2 contains other kinds of arrays. */
2233 if (flag_stack_protect == SPCT_FLAG_ALL
2234 || flag_stack_protect == SPCT_FLAG_STRONG
2235 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2236 && lookup_attribute ("stack_protect",
2237 DECL_ATTRIBUTES (current_function_decl))))
2238 expand_stack_vars (stack_protect_decl_phase_2, &data);
2241 if (asan_sanitize_stack_p ())
2242 /* Phase 3, any partitions that need asan protection
2243 in addition to phase 1 and 2. */
2244 expand_stack_vars (asan_decl_phase_3, &data);
2246 /* ASAN description strings don't yet have a syntax for expressing
2247 polynomial offsets. */
2248 HOST_WIDE_INT prev_offset;
2249 if (!data.asan_vec.is_empty ()
2250 && frame_offset.is_constant (&prev_offset))
2252 HOST_WIDE_INT offset, sz, redzonesz;
2253 redzonesz = ASAN_RED_ZONE_SIZE;
2254 sz = data.asan_vec[0] - prev_offset;
2255 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2256 && data.asan_alignb <= 4096
2257 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2258 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2259 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2260 /* Allocating a constant amount of space from a constant
2261 starting offset must give a constant result. */
2262 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2263 .to_constant ());
2264 data.asan_vec.safe_push (prev_offset);
2265 data.asan_vec.safe_push (offset);
2266 /* Leave space for alignment if STRICT_ALIGNMENT. */
2267 if (STRICT_ALIGNMENT)
2268 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2269 << ASAN_SHADOW_SHIFT)
2270 / BITS_PER_UNIT, 1);
2272 var_end_seq
2273 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2274 data.asan_base,
2275 data.asan_alignb,
2276 data.asan_vec.address (),
2277 data.asan_decl_vec.address (),
2278 data.asan_vec.length ());
2281 expand_stack_vars (NULL, &data);
2284 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2285 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2286 virtual_stack_vars_rtx,
2287 var_end_seq);
2289 fini_vars_expansion ();
2291 /* If there were any artificial non-ignored vars without rtl
2292 found earlier, see if deferred stack allocation hasn't assigned
2293 rtl to them. */
2294 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2296 rtx rtl = DECL_RTL_IF_SET (var);
2298 /* Keep artificial non-ignored vars in cfun->local_decls
2299 chain until instantiate_decls. */
2300 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2301 add_local_decl (cfun, var);
2304 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2305 if (STACK_ALIGNMENT_NEEDED)
2307 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2308 if (FRAME_GROWS_DOWNWARD)
2309 frame_offset = aligned_lower_bound (frame_offset, align);
2310 else
2311 frame_offset = aligned_upper_bound (frame_offset, align);
2314 return var_end_seq;
2318 /* If we need to produce a detailed dump, print the tree representation
2319 for STMT to the dump file. SINCE is the last RTX after which the RTL
2320 generated for STMT should have been appended. */
2322 static void
2323 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2325 if (dump_file && (dump_flags & TDF_DETAILS))
2327 fprintf (dump_file, "\n;; ");
2328 print_gimple_stmt (dump_file, stmt, 0,
2329 TDF_SLIM | (dump_flags & TDF_LINENO));
2330 fprintf (dump_file, "\n");
2332 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2336 /* Maps the blocks that do not contain tree labels to rtx labels. */
2338 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2340 /* Returns the label_rtx expression for a label starting basic block BB. */
2342 static rtx_code_label *
2343 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2345 gimple_stmt_iterator gsi;
2346 tree lab;
2348 if (bb->flags & BB_RTL)
2349 return block_label (bb);
2351 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2352 if (elt)
2353 return *elt;
2355 /* Find the tree label if it is present. */
2357 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2359 glabel *lab_stmt;
2361 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2362 if (!lab_stmt)
2363 break;
2365 lab = gimple_label_label (lab_stmt);
2366 if (DECL_NONLOCAL (lab))
2367 break;
2369 return jump_target_rtx (lab);
2372 rtx_code_label *l = gen_label_rtx ();
2373 lab_rtx_for_bb->put (bb, l);
2374 return l;
2378 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2379 of a basic block where we just expanded the conditional at the end,
2380 possibly clean up the CFG and instruction sequence. LAST is the
2381 last instruction before the just emitted jump sequence. */
2383 static void
2384 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2386 /* Special case: when jumpif decides that the condition is
2387 trivial it emits an unconditional jump (and the necessary
2388 barrier). But we still have two edges, the fallthru one is
2389 wrong. purge_dead_edges would clean this up later. Unfortunately
2390 we have to insert insns (and split edges) before
2391 find_many_sub_basic_blocks and hence before purge_dead_edges.
2392 But splitting edges might create new blocks which depend on the
2393 fact that if there are two edges there's no barrier. So the
2394 barrier would get lost and verify_flow_info would ICE. Instead
2395 of auditing all edge splitters to care for the barrier (which
2396 normally isn't there in a cleaned CFG), fix it here. */
2397 if (BARRIER_P (get_last_insn ()))
2399 rtx_insn *insn;
2400 remove_edge (e);
2401 /* Now, we have a single successor block, if we have insns to
2402 insert on the remaining edge we potentially will insert
2403 it at the end of this block (if the dest block isn't feasible)
2404 in order to avoid splitting the edge. This insertion will take
2405 place in front of the last jump. But we might have emitted
2406 multiple jumps (conditional and one unconditional) to the
2407 same destination. Inserting in front of the last one then
2408 is a problem. See PR 40021. We fix this by deleting all
2409 jumps except the last unconditional one. */
2410 insn = PREV_INSN (get_last_insn ());
2411 /* Make sure we have an unconditional jump. Otherwise we're
2412 confused. */
2413 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2414 for (insn = PREV_INSN (insn); insn != last;)
2416 insn = PREV_INSN (insn);
2417 if (JUMP_P (NEXT_INSN (insn)))
2419 if (!any_condjump_p (NEXT_INSN (insn)))
2421 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2422 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2424 delete_insn (NEXT_INSN (insn));
2430 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2431 Returns a new basic block if we've terminated the current basic
2432 block and created a new one. */
2434 static basic_block
2435 expand_gimple_cond (basic_block bb, gcond *stmt)
2437 basic_block new_bb, dest;
2438 edge true_edge;
2439 edge false_edge;
2440 rtx_insn *last2, *last;
2441 enum tree_code code;
2442 tree op0, op1;
2444 code = gimple_cond_code (stmt);
2445 op0 = gimple_cond_lhs (stmt);
2446 op1 = gimple_cond_rhs (stmt);
2447 /* We're sometimes presented with such code:
2448 D.123_1 = x < y;
2449 if (D.123_1 != 0)
2451 This would expand to two comparisons which then later might
2452 be cleaned up by combine. But some pattern matchers like if-conversion
2453 work better when there's only one compare, so make up for this
2454 here as special exception if TER would have made the same change. */
2455 if (SA.values
2456 && TREE_CODE (op0) == SSA_NAME
2457 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2458 && TREE_CODE (op1) == INTEGER_CST
2459 && ((gimple_cond_code (stmt) == NE_EXPR
2460 && integer_zerop (op1))
2461 || (gimple_cond_code (stmt) == EQ_EXPR
2462 && integer_onep (op1)))
2463 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2465 gimple *second = SSA_NAME_DEF_STMT (op0);
2466 if (gimple_code (second) == GIMPLE_ASSIGN)
2468 enum tree_code code2 = gimple_assign_rhs_code (second);
2469 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2471 code = code2;
2472 op0 = gimple_assign_rhs1 (second);
2473 op1 = gimple_assign_rhs2 (second);
2475 /* If jumps are cheap and the target does not support conditional
2476 compare, turn some more codes into jumpy sequences. */
2477 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2478 && targetm.gen_ccmp_first == NULL)
2480 if ((code2 == BIT_AND_EXPR
2481 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2482 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2483 || code2 == TRUTH_AND_EXPR)
2485 code = TRUTH_ANDIF_EXPR;
2486 op0 = gimple_assign_rhs1 (second);
2487 op1 = gimple_assign_rhs2 (second);
2489 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2491 code = TRUTH_ORIF_EXPR;
2492 op0 = gimple_assign_rhs1 (second);
2493 op1 = gimple_assign_rhs2 (second);
2499 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2500 into (x - C2) * C3 < C4. */
2501 if ((code == EQ_EXPR || code == NE_EXPR)
2502 && TREE_CODE (op0) == SSA_NAME
2503 && TREE_CODE (op1) == INTEGER_CST)
2504 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2506 last2 = last = get_last_insn ();
2508 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2509 set_curr_insn_location (gimple_location (stmt));
2511 /* These flags have no purpose in RTL land. */
2512 true_edge->flags &= ~EDGE_TRUE_VALUE;
2513 false_edge->flags &= ~EDGE_FALSE_VALUE;
2515 /* We can either have a pure conditional jump with one fallthru edge or
2516 two-way jump that needs to be decomposed into two basic blocks. */
2517 if (false_edge->dest == bb->next_bb)
2519 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2520 true_edge->probability);
2521 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2522 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2523 set_curr_insn_location (true_edge->goto_locus);
2524 false_edge->flags |= EDGE_FALLTHRU;
2525 maybe_cleanup_end_of_block (false_edge, last);
2526 return NULL;
2528 if (true_edge->dest == bb->next_bb)
2530 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2531 false_edge->probability);
2532 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2533 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2534 set_curr_insn_location (false_edge->goto_locus);
2535 true_edge->flags |= EDGE_FALLTHRU;
2536 maybe_cleanup_end_of_block (true_edge, last);
2537 return NULL;
2540 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2541 true_edge->probability);
2542 last = get_last_insn ();
2543 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2544 set_curr_insn_location (false_edge->goto_locus);
2545 emit_jump (label_rtx_for_bb (false_edge->dest));
2547 BB_END (bb) = last;
2548 if (BARRIER_P (BB_END (bb)))
2549 BB_END (bb) = PREV_INSN (BB_END (bb));
2550 update_bb_for_insn (bb);
2552 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2553 dest = false_edge->dest;
2554 redirect_edge_succ (false_edge, new_bb);
2555 false_edge->flags |= EDGE_FALLTHRU;
2556 new_bb->count = false_edge->count ();
2557 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2558 add_bb_to_loop (new_bb, loop);
2559 if (loop->latch == bb
2560 && loop->header == dest)
2561 loop->latch = new_bb;
2562 make_single_succ_edge (new_bb, dest, 0);
2563 if (BARRIER_P (BB_END (new_bb)))
2564 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2565 update_bb_for_insn (new_bb);
2567 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2569 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2571 set_curr_insn_location (true_edge->goto_locus);
2572 true_edge->goto_locus = curr_insn_location ();
2575 return new_bb;
2578 /* Mark all calls that can have a transaction restart. */
2580 static void
2581 mark_transaction_restart_calls (gimple *stmt)
2583 struct tm_restart_node dummy;
2584 tm_restart_node **slot;
2586 if (!cfun->gimple_df->tm_restart)
2587 return;
2589 dummy.stmt = stmt;
2590 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2591 if (slot)
2593 struct tm_restart_node *n = *slot;
2594 tree list = n->label_or_list;
2595 rtx_insn *insn;
2597 for (insn = next_real_insn (get_last_insn ());
2598 !CALL_P (insn);
2599 insn = next_real_insn (insn))
2600 continue;
2602 if (TREE_CODE (list) == LABEL_DECL)
2603 add_reg_note (insn, REG_TM, label_rtx (list));
2604 else
2605 for (; list ; list = TREE_CHAIN (list))
2606 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2610 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2611 statement STMT. */
2613 static void
2614 expand_call_stmt (gcall *stmt)
2616 tree exp, decl, lhs;
2617 bool builtin_p;
2618 size_t i;
2620 if (gimple_call_internal_p (stmt))
2622 expand_internal_call (stmt);
2623 return;
2626 /* If this is a call to a built-in function and it has no effect other
2627 than setting the lhs, try to implement it using an internal function
2628 instead. */
2629 decl = gimple_call_fndecl (stmt);
2630 if (gimple_call_lhs (stmt)
2631 && !gimple_has_side_effects (stmt)
2632 && (optimize || (decl && called_as_built_in (decl))))
2634 internal_fn ifn = replacement_internal_fn (stmt);
2635 if (ifn != IFN_LAST)
2637 expand_internal_call (ifn, stmt);
2638 return;
2642 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2644 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2645 builtin_p = decl && fndecl_built_in_p (decl);
2647 /* If this is not a builtin function, the function type through which the
2648 call is made may be different from the type of the function. */
2649 if (!builtin_p)
2650 CALL_EXPR_FN (exp)
2651 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2652 CALL_EXPR_FN (exp));
2654 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2655 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2657 for (i = 0; i < gimple_call_num_args (stmt); i++)
2659 tree arg = gimple_call_arg (stmt, i);
2660 gimple *def;
2661 /* TER addresses into arguments of builtin functions so we have a
2662 chance to infer more correct alignment information. See PR39954. */
2663 if (builtin_p
2664 && TREE_CODE (arg) == SSA_NAME
2665 && (def = get_gimple_for_ssa_name (arg))
2666 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2667 arg = gimple_assign_rhs1 (def);
2668 CALL_EXPR_ARG (exp, i) = arg;
2671 if (gimple_has_side_effects (stmt))
2672 TREE_SIDE_EFFECTS (exp) = 1;
2674 if (gimple_call_nothrow_p (stmt))
2675 TREE_NOTHROW (exp) = 1;
2677 if (gimple_no_warning_p (stmt))
2678 TREE_NO_WARNING (exp) = 1;
2680 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2681 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2682 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2683 if (decl
2684 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2685 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2686 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2687 else
2688 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2689 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2690 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2691 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2693 /* Ensure RTL is created for debug args. */
2694 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2696 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2697 unsigned int ix;
2698 tree dtemp;
2700 if (debug_args)
2701 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2703 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2704 expand_debug_expr (dtemp);
2708 rtx_insn *before_call = get_last_insn ();
2709 lhs = gimple_call_lhs (stmt);
2710 if (lhs)
2711 expand_assignment (lhs, exp, false);
2712 else
2713 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2715 /* If the gimple call is an indirect call and has 'nocf_check'
2716 attribute find a generated CALL insn to mark it as no
2717 control-flow verification is needed. */
2718 if (gimple_call_nocf_check_p (stmt)
2719 && !gimple_call_fndecl (stmt))
2721 rtx_insn *last = get_last_insn ();
2722 while (!CALL_P (last)
2723 && last != before_call)
2724 last = PREV_INSN (last);
2726 if (last != before_call)
2727 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2730 mark_transaction_restart_calls (stmt);
2734 /* Generate RTL for an asm statement (explicit assembler code).
2735 STRING is a STRING_CST node containing the assembler code text,
2736 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2737 insn is volatile; don't optimize it. */
2739 static void
2740 expand_asm_loc (tree string, int vol, location_t locus)
2742 rtx body;
2744 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2745 ggc_strdup (TREE_STRING_POINTER (string)),
2746 locus);
2748 MEM_VOLATILE_P (body) = vol;
2750 /* Non-empty basic ASM implicitly clobbers memory. */
2751 if (TREE_STRING_LENGTH (string) != 0)
2753 rtx asm_op, clob;
2754 unsigned i, nclobbers;
2755 auto_vec<rtx> input_rvec, output_rvec;
2756 auto_vec<const char *> constraints;
2757 auto_vec<rtx> clobber_rvec;
2758 HARD_REG_SET clobbered_regs;
2759 CLEAR_HARD_REG_SET (clobbered_regs);
2761 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2762 clobber_rvec.safe_push (clob);
2764 if (targetm.md_asm_adjust)
2765 targetm.md_asm_adjust (output_rvec, input_rvec,
2766 constraints, clobber_rvec,
2767 clobbered_regs);
2769 asm_op = body;
2770 nclobbers = clobber_rvec.length ();
2771 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2773 XVECEXP (body, 0, 0) = asm_op;
2774 for (i = 0; i < nclobbers; i++)
2775 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2778 emit_insn (body);
/* Count how many characters of the NUL-terminated string S compare
   equal to C.  The terminating NUL itself is never counted.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;
  for (const char *p = s; *p != '\0'; p++)
    if (*p == c)
      count++;
  return count;
}
2791 /* A subroutine of expand_asm_operands. Check that all operands have
2792 the same number of alternatives. Return true if so. */
2794 static bool
2795 check_operand_nalternatives (const vec<const char *> &constraints)
2797 unsigned len = constraints.length();
2798 if (len > 0)
2800 int nalternatives = n_occurrences (',', constraints[0]);
2802 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2804 error ("too many alternatives in %<asm%>");
2805 return false;
2808 for (unsigned i = 1; i < len; ++i)
2809 if (n_occurrences (',', constraints[i]) != nalternatives)
2811 error ("operand constraints for %<asm%> differ "
2812 "in number of alternatives");
2813 return false;
2816 return true;
2819 /* Check for overlap between registers marked in CLOBBERED_REGS and
2820 anything inappropriate in T. Emit error and return the register
2821 variable definition for error, NULL_TREE for ok. */
2823 static bool
2824 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2826 /* Conflicts between asm-declared register variables and the clobber
2827 list are not allowed. */
2828 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2830 if (overlap)
2832 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2833 DECL_NAME (overlap));
2835 /* Reset registerness to stop multiple errors emitted for a single
2836 variable. */
2837 DECL_REGISTER (overlap) = 0;
2838 return true;
2841 return false;
2844 /* Generate RTL for an asm statement with arguments.
2845 STRING is the instruction template.
2846 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2847 Each output or input has an expression in the TREE_VALUE and
2848 a tree list in TREE_PURPOSE which in turn contains a constraint
2849 name in TREE_VALUE (or NULL_TREE) and a constraint string
2850 in TREE_PURPOSE.
2851 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2852 that is clobbered by this insn.
2854 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2855 should be the fallthru basic block of the asm goto.
2857 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2858 Some elements of OUTPUTS may be replaced with trees representing temporary
2859 values. The caller should copy those temporary values to the originally
2860 specified lvalues.
2862 VOL nonzero means the insn is volatile; don't optimize it. */
2864 static void
2865 expand_asm_stmt (gasm *stmt)
2867 class save_input_location
2869 location_t old;
2871 public:
2872 explicit save_input_location(location_t where)
2874 old = input_location;
2875 input_location = where;
2878 ~save_input_location()
2880 input_location = old;
2884 location_t locus = gimple_location (stmt);
2886 if (gimple_asm_input_p (stmt))
2888 const char *s = gimple_asm_string (stmt);
2889 tree string = build_string (strlen (s), s);
2890 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2891 return;
2894 /* There are some legacy diagnostics in here, and this also avoids a
2895 sixth parameter to targetm.md_asm_adjust. */
2896 save_input_location s_i_l(locus);
2898 unsigned noutputs = gimple_asm_noutputs (stmt);
2899 unsigned ninputs = gimple_asm_ninputs (stmt);
2900 unsigned nlabels = gimple_asm_nlabels (stmt);
2901 unsigned i;
2903 /* ??? Diagnose during gimplification? */
2904 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2906 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2907 return;
2910 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2911 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2912 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2914 /* Copy the gimple vectors into new vectors that we can manipulate. */
2916 output_tvec.safe_grow (noutputs);
2917 input_tvec.safe_grow (ninputs);
2918 constraints.safe_grow (noutputs + ninputs);
2920 for (i = 0; i < noutputs; ++i)
2922 tree t = gimple_asm_output_op (stmt, i);
2923 output_tvec[i] = TREE_VALUE (t);
2924 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2926 for (i = 0; i < ninputs; i++)
2928 tree t = gimple_asm_input_op (stmt, i);
2929 input_tvec[i] = TREE_VALUE (t);
2930 constraints[i + noutputs]
2931 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2934 /* ??? Diagnose during gimplification? */
2935 if (! check_operand_nalternatives (constraints))
2936 return;
2938 /* Count the number of meaningful clobbered registers, ignoring what
2939 we would ignore later. */
2940 auto_vec<rtx> clobber_rvec;
2941 HARD_REG_SET clobbered_regs;
2942 CLEAR_HARD_REG_SET (clobbered_regs);
2944 if (unsigned n = gimple_asm_nclobbers (stmt))
2946 clobber_rvec.reserve (n);
2947 for (i = 0; i < n; i++)
2949 tree t = gimple_asm_clobber_op (stmt, i);
2950 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2951 int nregs, j;
2953 j = decode_reg_name_and_count (regname, &nregs);
2954 if (j < 0)
2956 if (j == -2)
2958 /* ??? Diagnose during gimplification? */
2959 error ("unknown register name %qs in %<asm%>", regname);
2961 else if (j == -4)
2963 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2964 clobber_rvec.safe_push (x);
2966 else
2968 /* Otherwise we should have -1 == empty string
2969 or -3 == cc, which is not a register. */
2970 gcc_assert (j == -1 || j == -3);
2973 else
2974 for (int reg = j; reg < j + nregs; reg++)
2976 /* Clobbering the PIC register is an error. */
2977 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2979 /* ??? Diagnose during gimplification? */
2980 error ("PIC register clobbered by %qs in %<asm%>",
2981 regname);
2982 return;
2985 SET_HARD_REG_BIT (clobbered_regs, reg);
2986 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2987 clobber_rvec.safe_push (x);
2991 unsigned nclobbers = clobber_rvec.length();
2993 /* First pass over inputs and outputs checks validity and sets
2994 mark_addressable if needed. */
2995 /* ??? Diagnose during gimplification? */
2997 for (i = 0; i < noutputs; ++i)
2999 tree val = output_tvec[i];
3000 tree type = TREE_TYPE (val);
3001 const char *constraint;
3002 bool is_inout;
3003 bool allows_reg;
3004 bool allows_mem;
3006 /* Try to parse the output constraint. If that fails, there's
3007 no point in going further. */
3008 constraint = constraints[i];
3009 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3010 &allows_mem, &allows_reg, &is_inout))
3011 return;
3013 /* If the output is a hard register, verify it doesn't conflict with
3014 any other operand's possible hard register use. */
3015 if (DECL_P (val)
3016 && REG_P (DECL_RTL (val))
3017 && HARD_REGISTER_P (DECL_RTL (val)))
3019 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3020 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3021 unsigned long match;
3023 /* Verify the other outputs do not use the same hard register. */
3024 for (j = i + 1; j < noutputs; ++j)
3025 if (DECL_P (output_tvec[j])
3026 && REG_P (DECL_RTL (output_tvec[j]))
3027 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3028 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3029 error ("invalid hard register usage between output operands");
3031 /* Verify matching constraint operands use the same hard register
3032 and that the non-matching constraint operands do not use the same
3033 hard register if the output is an early clobber operand. */
3034 for (j = 0; j < ninputs; ++j)
3035 if (DECL_P (input_tvec[j])
3036 && REG_P (DECL_RTL (input_tvec[j]))
3037 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3039 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3040 switch (*constraints[j + noutputs])
3042 case '0': case '1': case '2': case '3': case '4':
3043 case '5': case '6': case '7': case '8': case '9':
3044 match = strtoul (constraints[j + noutputs], NULL, 10);
3045 break;
3046 default:
3047 match = ULONG_MAX;
3048 break;
3050 if (i == match
3051 && output_hregno != input_hregno)
3052 error ("invalid hard register usage between output operand "
3053 "and matching constraint operand");
3054 else if (early_clobber_p
3055 && i != match
3056 && output_hregno == input_hregno)
3057 error ("invalid hard register usage between earlyclobber "
3058 "operand and input operand");
3062 if (! allows_reg
3063 && (allows_mem
3064 || is_inout
3065 || (DECL_P (val)
3066 && REG_P (DECL_RTL (val))
3067 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3068 mark_addressable (val);
3071 for (i = 0; i < ninputs; ++i)
3073 bool allows_reg, allows_mem;
3074 const char *constraint;
3076 constraint = constraints[i + noutputs];
3077 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3078 constraints.address (),
3079 &allows_mem, &allows_reg))
3080 return;
3082 if (! allows_reg && allows_mem)
3083 mark_addressable (input_tvec[i]);
3086 /* Second pass evaluates arguments. */
3088 /* Make sure stack is consistent for asm goto. */
3089 if (nlabels > 0)
3090 do_pending_stack_adjust ();
3091 int old_generating_concat_p = generating_concat_p;
3093 /* Vector of RTX's of evaluated output operands. */
3094 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3095 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3096 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3098 output_rvec.safe_grow (noutputs);
3100 for (i = 0; i < noutputs; ++i)
3102 tree val = output_tvec[i];
3103 tree type = TREE_TYPE (val);
3104 bool is_inout, allows_reg, allows_mem, ok;
3105 rtx op;
3107 ok = parse_output_constraint (&constraints[i], i, ninputs,
3108 noutputs, &allows_mem, &allows_reg,
3109 &is_inout);
3110 gcc_assert (ok);
3112 /* If an output operand is not a decl or indirect ref and our constraint
3113 allows a register, make a temporary to act as an intermediate.
3114 Make the asm insn write into that, then we will copy it to
3115 the real output operand. Likewise for promoted variables. */
3117 generating_concat_p = 0;
3119 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3120 || (DECL_P (val)
3121 && (allows_mem || REG_P (DECL_RTL (val)))
3122 && ! (REG_P (DECL_RTL (val))
3123 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3124 || ! allows_reg
3125 || is_inout
3126 || TREE_ADDRESSABLE (type))
3128 op = expand_expr (val, NULL_RTX, VOIDmode,
3129 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3130 if (MEM_P (op))
3131 op = validize_mem (op);
3133 if (! allows_reg && !MEM_P (op))
3134 error ("output number %d not directly addressable", i);
3135 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3136 || GET_CODE (op) == CONCAT)
3138 rtx old_op = op;
3139 op = gen_reg_rtx (GET_MODE (op));
3141 generating_concat_p = old_generating_concat_p;
3143 if (is_inout)
3144 emit_move_insn (op, old_op);
3146 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3147 emit_move_insn (old_op, op);
3148 after_rtl_seq = get_insns ();
3149 after_rtl_end = get_last_insn ();
3150 end_sequence ();
3153 else
3155 op = assign_temp (type, 0, 1);
3156 op = validize_mem (op);
3157 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3158 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3160 generating_concat_p = old_generating_concat_p;
3162 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3163 expand_assignment (val, make_tree (type, op), false);
3164 after_rtl_seq = get_insns ();
3165 after_rtl_end = get_last_insn ();
3166 end_sequence ();
3168 output_rvec[i] = op;
3170 if (is_inout)
3171 inout_opnum.safe_push (i);
3174 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3175 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3177 input_rvec.safe_grow (ninputs);
3178 input_mode.safe_grow (ninputs);
3180 generating_concat_p = 0;
3182 for (i = 0; i < ninputs; ++i)
3184 tree val = input_tvec[i];
3185 tree type = TREE_TYPE (val);
3186 bool allows_reg, allows_mem, ok;
3187 const char *constraint;
3188 rtx op;
3190 constraint = constraints[i + noutputs];
3191 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3192 constraints.address (),
3193 &allows_mem, &allows_reg);
3194 gcc_assert (ok);
3196 /* EXPAND_INITIALIZER will not generate code for valid initializer
3197 constants, but will still generate code for other types of operand.
3198 This is the behavior we want for constant constraints. */
3199 op = expand_expr (val, NULL_RTX, VOIDmode,
3200 allows_reg ? EXPAND_NORMAL
3201 : allows_mem ? EXPAND_MEMORY
3202 : EXPAND_INITIALIZER);
3204 /* Never pass a CONCAT to an ASM. */
3205 if (GET_CODE (op) == CONCAT)
3206 op = force_reg (GET_MODE (op), op);
3207 else if (MEM_P (op))
3208 op = validize_mem (op);
3210 if (asm_operand_ok (op, constraint, NULL) <= 0)
3212 if (allows_reg && TYPE_MODE (type) != BLKmode)
3213 op = force_reg (TYPE_MODE (type), op);
3214 else if (!allows_mem)
3215 warning (0, "asm operand %d probably doesn%'t match constraints",
3216 i + noutputs);
3217 else if (MEM_P (op))
3219 /* We won't recognize either volatile memory or memory
3220 with a queued address as a valid memory_operand
3221 at this point. Ignore it: clearly this *is* a memory. */
3223 else
3224 gcc_unreachable ();
3226 input_rvec[i] = op;
3227 input_mode[i] = TYPE_MODE (type);
3230 /* For in-out operands, copy output rtx to input rtx. */
3231 unsigned ninout = inout_opnum.length();
3232 for (i = 0; i < ninout; i++)
3234 int j = inout_opnum[i];
3235 rtx o = output_rvec[j];
3237 input_rvec.safe_push (o);
3238 input_mode.safe_push (GET_MODE (o));
3240 char buffer[16];
3241 sprintf (buffer, "%d", j);
3242 constraints.safe_push (ggc_strdup (buffer));
3244 ninputs += ninout;
3246 /* Sometimes we wish to automatically clobber registers across an asm.
3247 Case in point is when the i386 backend moved from cc0 to a hard reg --
3248 maintaining source-level compatibility means automatically clobbering
3249 the flags register. */
3250 rtx_insn *after_md_seq = NULL;
3251 if (targetm.md_asm_adjust)
3252 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3253 constraints, clobber_rvec,
3254 clobbered_regs);
3256 /* Do not allow the hook to change the output and input count,
3257 lest it mess up the operand numbering. */
3258 gcc_assert (output_rvec.length() == noutputs);
3259 gcc_assert (input_rvec.length() == ninputs);
3260 gcc_assert (constraints.length() == noutputs + ninputs);
3262 /* But it certainly can adjust the clobbers. */
3263 nclobbers = clobber_rvec.length();
3265 /* Third pass checks for easy conflicts. */
3266 /* ??? Why are we doing this on trees instead of rtx. */
3268 bool clobber_conflict_found = 0;
3269 for (i = 0; i < noutputs; ++i)
3270 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3271 clobber_conflict_found = 1;
3272 for (i = 0; i < ninputs - ninout; ++i)
3273 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3274 clobber_conflict_found = 1;
3276 /* Make vectors for the expression-rtx, constraint strings,
3277 and named operands. */
3279 rtvec argvec = rtvec_alloc (ninputs);
3280 rtvec constraintvec = rtvec_alloc (ninputs);
3281 rtvec labelvec = rtvec_alloc (nlabels);
3283 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3284 : GET_MODE (output_rvec[0])),
3285 ggc_strdup (gimple_asm_string (stmt)),
3286 "", 0, argvec, constraintvec,
3287 labelvec, locus);
3288 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3290 for (i = 0; i < ninputs; ++i)
3292 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3293 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3294 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3295 constraints[i + noutputs],
3296 locus);
3299 /* Copy labels to the vector. */
3300 rtx_code_label *fallthru_label = NULL;
3301 if (nlabels > 0)
3303 basic_block fallthru_bb = NULL;
3304 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3305 if (fallthru)
3306 fallthru_bb = fallthru->dest;
3308 for (i = 0; i < nlabels; ++i)
3310 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3311 rtx_insn *r;
3312 /* If asm goto has any labels in the fallthru basic block, use
3313 a label that we emit immediately after the asm goto. Expansion
3314 may insert further instructions into the same basic block after
3315 asm goto and if we don't do this, insertion of instructions on
3316 the fallthru edge might misbehave. See PR58670. */
3317 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3319 if (fallthru_label == NULL_RTX)
3320 fallthru_label = gen_label_rtx ();
3321 r = fallthru_label;
3323 else
3324 r = label_rtx (label);
3325 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3329 /* Now, for each output, construct an rtx
3330 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3331 ARGVEC CONSTRAINTS OPNAMES))
3332 If there is more than one, put them inside a PARALLEL. */
3334 if (nlabels > 0 && nclobbers == 0)
3336 gcc_assert (noutputs == 0);
3337 emit_jump_insn (body);
3339 else if (noutputs == 0 && nclobbers == 0)
3341 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3342 emit_insn (body);
3344 else if (noutputs == 1 && nclobbers == 0)
3346 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3347 emit_insn (gen_rtx_SET (output_rvec[0], body));
3349 else
3351 rtx obody = body;
3352 int num = noutputs;
3354 if (num == 0)
3355 num = 1;
3357 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3359 /* For each output operand, store a SET. */
3360 for (i = 0; i < noutputs; ++i)
3362 rtx src, o = output_rvec[i];
3363 if (i == 0)
3365 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3366 src = obody;
3368 else
3370 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3371 ASM_OPERANDS_TEMPLATE (obody),
3372 constraints[i], i, argvec,
3373 constraintvec, labelvec, locus);
3374 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3376 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3379 /* If there are no outputs (but there are some clobbers)
3380 store the bare ASM_OPERANDS into the PARALLEL. */
3381 if (i == 0)
3382 XVECEXP (body, 0, i++) = obody;
3384 /* Store (clobber REG) for each clobbered register specified. */
3385 for (unsigned j = 0; j < nclobbers; ++j)
3387 rtx clobbered_reg = clobber_rvec[j];
3389 /* Do sanity check for overlap between clobbers and respectively
3390 input and outputs that hasn't been handled. Such overlap
3391 should have been detected and reported above. */
3392 if (!clobber_conflict_found && REG_P (clobbered_reg))
3394 /* We test the old body (obody) contents to avoid
3395 tripping over the under-construction body. */
3396 for (unsigned k = 0; k < noutputs; ++k)
3397 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3398 internal_error ("asm clobber conflict with output operand");
3400 for (unsigned k = 0; k < ninputs - ninout; ++k)
3401 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3402 internal_error ("asm clobber conflict with input operand");
3405 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3408 if (nlabels > 0)
3409 emit_jump_insn (body);
3410 else
3411 emit_insn (body);
3414 generating_concat_p = old_generating_concat_p;
3416 if (fallthru_label)
3417 emit_label (fallthru_label);
3419 if (after_md_seq)
3420 emit_insn (after_md_seq);
3421 if (after_rtl_seq)
3422 emit_insn (after_rtl_seq);
3424 free_temp_slots ();
3425 crtl->has_asm_statement = 1;
3428 /* Emit code to jump to the address
3429 specified by the pointer expression EXP. */
3431 static void
3432 expand_computed_goto (tree exp)
3434 rtx x = expand_normal (exp);
3436 do_pending_stack_adjust ();
3437 emit_indirect_jump (x);
3440 /* Generate RTL code for a `goto' statement with target label LABEL.
3441 LABEL should be a LABEL_DECL tree node that was or will later be
3442 defined with `expand_label'. */
3444 static void
3445 expand_goto (tree label)
3447 if (flag_checking)
3449 /* Check for a nonlocal goto to a containing function. Should have
3450 gotten translated to __builtin_nonlocal_goto. */
3451 tree context = decl_function_context (label);
3452 gcc_assert (!context || context == current_function_decl);
3455 emit_jump (jump_target_rtx (label));
3458 /* Output a return with no value. */
3460 static void
3461 expand_null_return_1 (void)
3463 clear_pending_stack_adjust ();
3464 do_pending_stack_adjust ();
3465 emit_jump (return_label);
3468 /* Generate RTL to return from the current function, with no value.
3469 (That is, we do not do anything about returning any value.) */
3471 void
3472 expand_null_return (void)
3474 /* If this function was declared to return a value, but we
3475 didn't, clobber the return registers so that they are not
3476 propagated live to the rest of the function. */
3477 clobber_return_register ();
3479 expand_null_return_1 ();
3482 /* Generate RTL to return from the current function, with value VAL. */
3484 static void
3485 expand_value_return (rtx val)
3487 /* Copy the value to the return location unless it's already there. */
3489 tree decl = DECL_RESULT (current_function_decl);
3490 rtx return_reg = DECL_RTL (decl);
3491 if (return_reg != val)
3493 tree funtype = TREE_TYPE (current_function_decl);
3494 tree type = TREE_TYPE (decl);
3495 int unsignedp = TYPE_UNSIGNED (type);
3496 machine_mode old_mode = DECL_MODE (decl);
3497 machine_mode mode;
3498 if (DECL_BY_REFERENCE (decl))
3499 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3500 else
3501 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3503 if (mode != old_mode)
3504 val = convert_modes (mode, old_mode, val, unsignedp);
3506 if (GET_CODE (return_reg) == PARALLEL)
3507 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3508 else
3509 emit_move_insn (return_reg, val);
3512 expand_null_return_1 ();
3515 /* Generate RTL to evaluate the expression RETVAL and return it
3516 from the current function. */
3518 static void
3519 expand_return (tree retval)
3521 rtx result_rtl;
3522 rtx val = 0;
3523 tree retval_rhs;
3525 /* If function wants no value, give it none. */
3526 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3528 expand_normal (retval);
3529 expand_null_return ();
3530 return;
3533 if (retval == error_mark_node)
3535 /* Treat this like a return of no value from a function that
3536 returns a value. */
3537 expand_null_return ();
3538 return;
3540 else if ((TREE_CODE (retval) == MODIFY_EXPR
3541 || TREE_CODE (retval) == INIT_EXPR)
3542 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3543 retval_rhs = TREE_OPERAND (retval, 1);
3544 else
3545 retval_rhs = retval;
3547 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3549 /* If we are returning the RESULT_DECL, then the value has already
3550 been stored into it, so we don't have to do anything special. */
3551 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3552 expand_value_return (result_rtl);
3554 /* If the result is an aggregate that is being returned in one (or more)
3555 registers, load the registers here. */
3557 else if (retval_rhs != 0
3558 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3559 && REG_P (result_rtl))
3561 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3562 if (val)
3564 /* Use the mode of the result value on the return register. */
3565 PUT_MODE (result_rtl, GET_MODE (val));
3566 expand_value_return (val);
3568 else
3569 expand_null_return ();
3571 else if (retval_rhs != 0
3572 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3573 && (REG_P (result_rtl)
3574 || (GET_CODE (result_rtl) == PARALLEL)))
3576 /* Compute the return value into a temporary (usually a pseudo reg). */
3578 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3579 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3580 val = force_not_mem (val);
3581 expand_value_return (val);
3583 else
3585 /* No hard reg used; calculate value into hard return reg. */
3586 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3587 expand_value_return (result_rtl);
3591 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3592 register, tell the rtl optimizers that its value is no longer
3593 needed. */
3595 static void
3596 expand_clobber (tree lhs)
3598 if (DECL_P (lhs))
3600 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3601 if (decl_rtl && REG_P (decl_rtl))
3603 machine_mode decl_mode = GET_MODE (decl_rtl);
3604 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3605 REGMODE_NATURAL_SIZE (decl_mode)))
3606 emit_clobber (decl_rtl);
3611 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3612 STMT that doesn't require special handling for outgoing edges. That
3613 is no tailcalls and no GIMPLE_COND. */
/* The statement codes handled are GIMPLE_GOTO, GIMPLE_LABEL, GIMPLE_NOP,
   GIMPLE_PREDICT, GIMPLE_SWITCH, GIMPLE_ASM, GIMPLE_CALL, GIMPLE_RETURN
   and GIMPLE_ASSIGN; any other code reaches gcc_unreachable.  The
   current insn location is set from STMT before dispatching.  */
3615 static void
3616 expand_gimple_stmt_1 (gimple *stmt)
3618 tree op0;
3620 set_curr_insn_location (gimple_location (stmt));
3622 switch (gimple_code (stmt))
/* A goto to a LABEL_DECL is a direct jump; any other destination is
   expanded as a computed goto.  */
3624 case GIMPLE_GOTO:
3625 op0 = gimple_goto_dest (stmt);
3626 if (TREE_CODE (op0) == LABEL_DECL)
3627 expand_goto (op0);
3628 else
3629 expand_computed_goto (op0);
3630 break;
3631 case GIMPLE_LABEL:
3632 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3633 break;
/* GIMPLE_NOP and GIMPLE_PREDICT emit nothing.  */
3634 case GIMPLE_NOP:
3635 case GIMPLE_PREDICT:
3636 break;
/* A switch with exactly one label is expanded as a goto to the
   default label; otherwise expand_case handles it.  */
3637 case GIMPLE_SWITCH:
3639 gswitch *swtch = as_a <gswitch *> (stmt);
3640 if (gimple_switch_num_labels (swtch) == 1)
3641 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3642 else
3643 expand_case (swtch);
3645 break;
3646 case GIMPLE_ASM:
3647 expand_asm_stmt (as_a <gasm *> (stmt));
3648 break;
3649 case GIMPLE_CALL:
3650 expand_call_stmt (as_a <gcall *> (stmt));
3651 break;
3653 case GIMPLE_RETURN:
3655 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3657 if (op0 && op0 != error_mark_node)
3659 tree result = DECL_RESULT (current_function_decl);
3661 /* If we are not returning the current function's RESULT_DECL,
3662 build an assignment to it. */
3663 if (op0 != result)
3665 /* I believe that a function's RESULT_DECL is unique. */
3666 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3668 /* ??? We'd like to use simply expand_assignment here,
3669 but this fails if the value is of BLKmode but the return
3670 decl is a register. expand_return has special handling
3671 for this combination, which eventually should move
3672 to common code. See comments there. Until then, let's
3673 build a modify expression :-/ */
3674 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3675 result, op0);
/* A missing return value becomes a null return.  Note that an
   error_mark_node value skips the wrapping above and is handed to
   expand_return unchanged.  */
3679 if (!op0)
3680 expand_null_return ();
3681 else
3682 expand_return (op0);
3684 break;
3686 case GIMPLE_ASSIGN:
3688 gassign *assign_stmt = as_a <gassign *> (stmt);
3689 tree lhs = gimple_assign_lhs (assign_stmt);
3691 /* Tree expand used to fiddle with |= and &= of two bitfield
3692 COMPONENT_REFs here. This can't happen with gimple, the LHS
3693 of binary assigns must be a gimple reg. */
/* First form: the LHS is not an SSA_NAME, or the RHS is a single
   operand.  The assert below checks that a non-SSA_NAME LHS always
   comes with a GIMPLE_SINGLE_RHS.  */
3695 if (TREE_CODE (lhs) != SSA_NAME
3696 || get_gimple_rhs_class (gimple_expr_code (stmt))
3697 == GIMPLE_SINGLE_RHS)
3699 tree rhs = gimple_assign_rhs1 (assign_stmt);
3700 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3701 == GIMPLE_SINGLE_RHS);
3702 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3703 /* Do not put locations on possibly shared trees. */
3704 && !is_gimple_min_invariant (rhs))
3705 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3706 if (TREE_CLOBBER_P (rhs))
3707 /* This is a clobber to mark the going out of scope for
3708 this LHS. */
3709 expand_clobber (lhs);
3710 else
3711 expand_assignment (lhs, rhs,
3712 gimple_assign_nontemporal_move_p (
3713 assign_stmt));
/* Second form: the LHS is an SSA_NAME and the RHS is a unary, binary
   or ternary operation.  The operands are collected into OPS and the
   operation is expanded with expand_expr_real_2.  */
3715 else
3717 rtx target, temp;
3718 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3719 struct separate_ops ops;
3720 bool promoted = false;
3722 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3723 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3724 promoted = true;
3726 ops.code = gimple_assign_rhs_code (assign_stmt);
3727 ops.type = TREE_TYPE (lhs);
/* The cases fall through on purpose so that a ternary RHS fills op2,
   op1 and op0, a binary RHS fills op1 and op0, and a unary RHS fills
   only op0.  */
3728 switch (get_gimple_rhs_class (ops.code))
3730 case GIMPLE_TERNARY_RHS:
3731 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3732 /* Fallthru */
3733 case GIMPLE_BINARY_RHS:
3734 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3735 /* Fallthru */
3736 case GIMPLE_UNARY_RHS:
3737 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3738 break;
3739 default:
3740 gcc_unreachable ();
3742 ops.location = gimple_location (stmt);
3744 /* If we want to use a nontemporal store, force the value to
3745 register first. If we store into a promoted register,
3746 don't directly expand to target. */
3747 temp = nontemporal || promoted ? NULL_RTX : target;
3748 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3749 EXPAND_NORMAL);
3751 if (temp == target)
3753 else if (promoted)
3755 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3756 /* If TEMP is a VOIDmode constant, use convert_modes to make
3757 sure that we properly convert it. */
3758 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3760 temp = convert_modes (GET_MODE (target),
3761 TYPE_MODE (ops.type),
3762 temp, unsignedp);
3763 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3764 GET_MODE (target), temp, unsignedp);
/* The promoted value is stored into the register underneath the
   SUBREG rather than into TARGET itself.  */
3767 convert_move (SUBREG_REG (target), temp, unsignedp);
3769 else if (nontemporal && emit_storent_insn (target, temp))
3771 else
3773 temp = force_operand (temp, target);
3774 if (temp != target)
3775 emit_move_insn (target, temp);
3779 break;
3781 default:
3782 gcc_unreachable ();
3786 /* Expand one gimple statement STMT and return the last RTL instruction
3787 before any of the newly generated ones.
3789 In addition to generating the necessary RTL instructions this also
3790 sets REG_EH_REGION notes if necessary and sets the current source
3791 location for diagnostics. */
3793 static rtx_insn *
3794 expand_gimple_stmt (gimple *stmt)
3796 location_t saved_location = input_location;
3797 rtx_insn *last = get_last_insn ();
3798 int lp_nr;
3800 gcc_assert (cfun);
3802 /* We need to save and restore the current source location so that errors
3803 discovered during expansion are emitted with the right location. But
3804 it would be better if the diagnostic routines used the source location
3805 embedded in the tree nodes rather than globals. */
3806 if (gimple_has_location (stmt))
3807 input_location = gimple_location (stmt);
3809 expand_gimple_stmt_1 (stmt);
3811 /* Free any temporaries used to evaluate this statement. */
3812 free_temp_slots ();
3814 input_location = saved_location;
3816 /* Mark all insns that may trap. */
3817 lp_nr = lookup_stmt_eh_lp (stmt);
3818 if (lp_nr)
3820 rtx_insn *insn;
3821 for (insn = next_real_insn (last); insn;
3822 insn = next_real_insn (insn))
3824 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3825 /* If we want exceptions for non-call insns, any
3826 may_trap_p instruction may throw. */
3827 && GET_CODE (PATTERN (insn)) != CLOBBER
3828 && GET_CODE (PATTERN (insn)) != CLOBBER_HIGH
3829 && GET_CODE (PATTERN (insn)) != USE
3830 && insn_could_throw_p (insn))
3831 make_reg_eh_region_note (insn, 0, lp_nr);
3835 return last;
3838 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3839 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3840 generated a tail call (something that might be denied by the ABI
3841 rules governing the call; see calls.c).
3843 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3844 can still reach the rest of BB. The case here is __builtin_sqrt,
3845 where the NaN result goes through the external function (with a
3846 tailcall) and the normal result happens via a sqrt instruction. */
/* BB is the block containing STMT.  When a sibling call was emitted,
   the value returned is BB itself, or a new basic block created for
   the insns that remain after the call's barrier.  */
3848 static basic_block
3849 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3851 rtx_insn *last2, *last;
3852 edge e;
3853 edge_iterator ei;
3854 profile_probability probability;
/* LAST2 remembers the insn preceding everything emitted for STMT; it is
   only used for the RTL dump calls below.  */
3856 last2 = last = expand_gimple_stmt (stmt);
/* Scan the newly emitted insns for a sibling call.  */
3858 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3859 if (CALL_P (last) && SIBLING_CALL_P (last))
3860 goto found;
/* No sibling call was emitted: report that BB can fall through and
   return NULL.  */
3862 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3864 *can_fallthru = true;
3865 return NULL;
3867 found:
3868 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3869 Any instructions emitted here are about to be deleted. */
3870 do_pending_stack_adjust ();
3872 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3873 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3874 EH or abnormal edges, we shouldn't have created a tail call in
3875 the first place. So it seems to me we should just be removing
3876 all edges here, or redirecting the existing fallthru edge to
3877 the exit block. */
/* PROBABILITY accumulates the probability of every edge removed below
   and is later assigned to the new sibcall edge.  */
3879 probability = profile_probability::never ();
/* The iterator is advanced only when an edge is kept; after
   remove_edge the loop re-reads the edge at the same position.  */
3881 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3883 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3885 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3886 e->dest->count -= e->count ();
3887 probability += e->probability;
3888 remove_edge (e);
3890 else
3891 ei_next (&ei);
3894 /* This is somewhat ugly: the call_expr expander often emits instructions
3895 after the sibcall (to perform the function return). These confuse the
3896 find_many_sub_basic_blocks code, so we need to get rid of these. */
/* The insn right after the sibling call is asserted to be a barrier.  */
3897 last = NEXT_INSN (last);
3898 gcc_assert (BARRIER_P (last));
/* Delete the insns following the barrier, stopping early (and marking
   the block as able to fall through) if a label is reached.  */
3900 *can_fallthru = false;
3901 while (NEXT_INSN (last))
3903 /* For instance an sqrt builtin expander expands if with
3904 sibcall in the then and label for `else`. */
3905 if (LABEL_P (NEXT_INSN (last)))
3907 *can_fallthru = true;
3908 break;
3910 delete_insn (NEXT_INSN (last));
/* Connect BB to the exit block with an abnormal sibcall edge and end
   BB at the barrier.  */
3913 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3914 | EDGE_SIBCALL);
3915 e->probability = probability;
3916 BB_END (bb) = last;
3917 update_bb_for_insn (bb);
/* Insns remain after the barrier (the loop above stopped at a label):
   place them in a new basic block, excluding a trailing barrier from
   that block's end.  */
3919 if (NEXT_INSN (last))
3921 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3923 last = BB_END (bb);
3924 if (BARRIER_P (last))
3925 BB_END (bb) = PREV_INSN (last);
3928 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3930 return bb;
3933 /* Return the difference between the floor and the truncated result of
3934 a signed division by OP1 with remainder MOD. */
3935 static rtx
3936 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3938 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3939 return gen_rtx_IF_THEN_ELSE
3940 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3941 gen_rtx_IF_THEN_ELSE
3942 (mode, gen_rtx_LT (BImode,
3943 gen_rtx_DIV (mode, op1, mod),
3944 const0_rtx),
3945 constm1_rtx, const0_rtx),
3946 const0_rtx);
3949 /* Return the difference between the ceil and the truncated result of
3950 a signed division by OP1 with remainder MOD. */
3951 static rtx
3952 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3954 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3955 return gen_rtx_IF_THEN_ELSE
3956 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3957 gen_rtx_IF_THEN_ELSE
3958 (mode, gen_rtx_GT (BImode,
3959 gen_rtx_DIV (mode, op1, mod),
3960 const0_rtx),
3961 const1_rtx, const0_rtx),
3962 const0_rtx);
3965 /* Return the difference between the ceil and the truncated result of
3966 an unsigned division by OP1 with remainder MOD. */
3967 static rtx
3968 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3970 /* (mod != 0 ? 1 : 0) */
3971 return gen_rtx_IF_THEN_ELSE
3972 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3973 const1_rtx, const0_rtx);
3976 /* Return the difference between the rounded and the truncated result
3977 of a signed division by OP1 with remainder MOD. Halfway cases are
3978 rounded away from zero, rather than to the nearest even number. */
3979 static rtx
3980 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3982 /* (abs (mod) >= abs (op1) - abs (mod)
3983 ? (op1 / mod > 0 ? 1 : -1)
3984 : 0) */
3985 return gen_rtx_IF_THEN_ELSE
3986 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3987 gen_rtx_MINUS (mode,
3988 gen_rtx_ABS (mode, op1),
3989 gen_rtx_ABS (mode, mod))),
3990 gen_rtx_IF_THEN_ELSE
3991 (mode, gen_rtx_GT (BImode,
3992 gen_rtx_DIV (mode, op1, mod),
3993 const0_rtx),
3994 const1_rtx, constm1_rtx),
3995 const0_rtx);
3998 /* Return the difference between the rounded and the truncated result
3999 of a unsigned division by OP1 with remainder MOD. Halfway cases
4000 are rounded away from zero, rather than to the nearest even
4001 number. */
4002 static rtx
4003 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4005 /* (mod >= op1 - mod ? 1 : 0) */
4006 return gen_rtx_IF_THEN_ELSE
4007 (mode, gen_rtx_GE (BImode, mod,
4008 gen_rtx_MINUS (mode, op1, mod)),
4009 const1_rtx, const0_rtx);
4012 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4013 any rtl. */
/* AS is the address space the address belongs to.  The result is X
   itself, a new rtx expressing the conversion, or NULL when the
   conversion cannot be expressed (only possible in the
   POINTERS_EXTEND_UNSIGNED branch below).  */
4015 static rtx
4016 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4017 addr_space_t as)
/* When POINTERS_EXTEND_UNSIGNED is not defined, nothing is converted:
   the modes are only checked and X is returned unchanged at the end
   of the function.  */
4019 #ifndef POINTERS_EXTEND_UNSIGNED
4020 gcc_assert (mode == Pmode
4021 || mode == targetm.addr_space.address_mode (as));
4022 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4023 #else
4024 rtx temp;
4026 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
/* Already in MODE, or a VOIDmode rtx: nothing to convert.  */
4028 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4029 return x;
4031 /* X must have some form of address mode already. */
4032 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
/* Narrowing takes the low part of X.  Widening uses ZERO_EXTEND when
   POINTERS_EXTEND_UNSIGNED is positive and SIGN_EXTEND when it is
   zero.  */
4033 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4034 x = lowpart_subreg (mode, x, xmode);
4035 else if (POINTERS_EXTEND_UNSIGNED > 0)
4036 x = gen_rtx_ZERO_EXTEND (mode, x);
4037 else if (!POINTERS_EXTEND_UNSIGNED)
4038 x = gen_rtx_SIGN_EXTEND (mode, x);
/* Remaining case: POINTERS_EXTEND_UNSIGNED is negative.  Only the rtx
   forms handled by the switch can be converted; anything else yields
   NULL.  */
4039 else
4041 switch (GET_CODE (x))
4043 case SUBREG:
4044 if ((SUBREG_PROMOTED_VAR_P (x)
4045 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4046 || (GET_CODE (SUBREG_REG (x)) == PLUS
4047 && REG_P (XEXP (SUBREG_REG (x), 0))
4048 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4049 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4050 && GET_MODE (SUBREG_REG (x)) == mode)
4051 return SUBREG_REG (x);
4052 break;
/* Labels and symbols are rebuilt or copied with MODE as their mode.  */
4053 case LABEL_REF:
4054 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4055 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4056 return temp;
4057 case SYMBOL_REF:
4058 temp = shallow_copy_rtx (x);
4059 PUT_MODE (temp, mode);
4060 return temp;
/* CONST, and PLUS/MINUS with a constant integer second operand,
   convert their first operand recursively; a NULL result from the
   recursion is propagated (CONST) or falls out to the NULL return
   below (PLUS/MINUS).  */
4061 case CONST:
4062 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4063 if (temp)
4064 temp = gen_rtx_CONST (mode, temp);
4065 return temp;
4066 case PLUS:
4067 case MINUS:
4068 if (CONST_INT_P (XEXP (x, 1)))
4070 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4071 if (temp)
4072 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4074 break;
4075 default:
4076 break;
4078 /* Don't know how to express ptr_extend as operation in debug info. */
4079 return NULL;
4081 #endif /* POINTERS_EXTEND_UNSIGNED */
4083 return x;
4086 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4087 by avoid_deep_ter_for_debug. */
4089 static hash_map<tree, tree> *deep_ter_debug_map;
4091 /* Split too deep TER chains for debug stmts using debug temporaries. */
4093 static void
4094 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4096 use_operand_p use_p;
4097 ssa_op_iter iter;
4098 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4100 tree use = USE_FROM_PTR (use_p);
4101 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4102 continue;
4103 gimple *g = get_gimple_for_ssa_name (use);
4104 if (g == NULL)
4105 continue;
4106 if (depth > 6 && !stmt_ends_bb_p (g))
4108 if (deep_ter_debug_map == NULL)
4109 deep_ter_debug_map = new hash_map<tree, tree>;
4111 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4112 if (vexpr != NULL)
4113 continue;
4114 vexpr = make_node (DEBUG_EXPR_DECL);
4115 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4116 DECL_ARTIFICIAL (vexpr) = 1;
4117 TREE_TYPE (vexpr) = TREE_TYPE (use);
4118 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4119 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4120 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4121 avoid_deep_ter_for_debug (def_temp, 0);
4123 else
4124 avoid_deep_ter_for_debug (g, depth + 1);
4128 /* Return an RTX equivalent to the value of the parameter DECL. */
4130 static rtx
4131 expand_debug_parm_decl (tree decl)
4133 rtx incoming = DECL_INCOMING_RTL (decl);
4135 if (incoming
4136 && GET_MODE (incoming) != BLKmode
4137 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4138 || (MEM_P (incoming)
4139 && REG_P (XEXP (incoming, 0))
4140 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4142 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4144 #ifdef HAVE_window_save
4145 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4146 If the target machine has an explicit window save instruction, the
4147 actual entry value is the corresponding OUTGOING_REGNO instead. */
4148 if (REG_P (incoming)
4149 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4150 incoming
4151 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4152 OUTGOING_REGNO (REGNO (incoming)), 0);
4153 else if (MEM_P (incoming))
4155 rtx reg = XEXP (incoming, 0);
4156 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4158 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4159 incoming = replace_equiv_address_nv (incoming, reg);
4161 else
4162 incoming = copy_rtx (incoming);
4164 #endif
4166 ENTRY_VALUE_EXP (rtl) = incoming;
4167 return rtl;
4170 if (incoming
4171 && GET_MODE (incoming) != BLKmode
4172 && !TREE_ADDRESSABLE (decl)
4173 && MEM_P (incoming)
4174 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4175 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4176 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4177 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4178 return copy_rtx (incoming);
4180 return NULL_RTX;
4183 /* Return an RTX equivalent to the value of the tree expression EXP. */
4185 static rtx
4186 expand_debug_expr (tree exp)
4188 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4189 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4190 machine_mode inner_mode = VOIDmode;
4191 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4192 addr_space_t as;
4193 scalar_int_mode op0_mode, op1_mode, addr_mode;
4195 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4197 case tcc_expression:
4198 switch (TREE_CODE (exp))
4200 case COND_EXPR:
4201 case DOT_PROD_EXPR:
4202 case SAD_EXPR:
4203 case WIDEN_MULT_PLUS_EXPR:
4204 case WIDEN_MULT_MINUS_EXPR:
4205 goto ternary;
4207 case TRUTH_ANDIF_EXPR:
4208 case TRUTH_ORIF_EXPR:
4209 case TRUTH_AND_EXPR:
4210 case TRUTH_OR_EXPR:
4211 case TRUTH_XOR_EXPR:
4212 goto binary;
4214 case TRUTH_NOT_EXPR:
4215 goto unary;
4217 default:
4218 break;
4220 break;
4222 ternary:
4223 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4224 if (!op2)
4225 return NULL_RTX;
4226 /* Fall through. */
4228 binary:
4229 case tcc_binary:
4230 if (mode == BLKmode)
4231 return NULL_RTX;
4232 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4233 if (!op1)
4234 return NULL_RTX;
4235 switch (TREE_CODE (exp))
4237 case LSHIFT_EXPR:
4238 case RSHIFT_EXPR:
4239 case LROTATE_EXPR:
4240 case RROTATE_EXPR:
4241 case WIDEN_LSHIFT_EXPR:
4242 /* Ensure second operand isn't wider than the first one. */
4243 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4244 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4245 && (GET_MODE_UNIT_PRECISION (mode)
4246 < GET_MODE_PRECISION (op1_mode)))
4247 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4248 break;
4249 default:
4250 break;
4252 /* Fall through. */
4254 unary:
4255 case tcc_unary:
4256 if (mode == BLKmode)
4257 return NULL_RTX;
4258 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4259 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4260 if (!op0)
4261 return NULL_RTX;
4262 break;
4264 case tcc_comparison:
4265 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4266 goto binary;
4268 case tcc_type:
4269 case tcc_statement:
4270 gcc_unreachable ();
4272 case tcc_constant:
4273 case tcc_exceptional:
4274 case tcc_declaration:
4275 case tcc_reference:
4276 case tcc_vl_exp:
4277 break;
4280 switch (TREE_CODE (exp))
4282 case STRING_CST:
4283 if (!lookup_constant_def (exp))
4285 if (strlen (TREE_STRING_POINTER (exp)) + 1
4286 != (size_t) TREE_STRING_LENGTH (exp))
4287 return NULL_RTX;
4288 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4289 op0 = gen_rtx_MEM (BLKmode, op0);
4290 set_mem_attributes (op0, exp, 0);
4291 return op0;
4293 /* Fall through. */
4295 case INTEGER_CST:
4296 case REAL_CST:
4297 case FIXED_CST:
4298 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4299 return op0;
4301 case POLY_INT_CST:
4302 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4304 case COMPLEX_CST:
4305 gcc_assert (COMPLEX_MODE_P (mode));
4306 op0 = expand_debug_expr (TREE_REALPART (exp));
4307 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4308 return gen_rtx_CONCAT (mode, op0, op1);
4310 case DEBUG_EXPR_DECL:
4311 op0 = DECL_RTL_IF_SET (exp);
4313 if (op0)
4314 return op0;
4316 op0 = gen_rtx_DEBUG_EXPR (mode);
4317 DEBUG_EXPR_TREE_DECL (op0) = exp;
4318 SET_DECL_RTL (exp, op0);
4320 return op0;
4322 case VAR_DECL:
4323 case PARM_DECL:
4324 case FUNCTION_DECL:
4325 case LABEL_DECL:
4326 case CONST_DECL:
4327 case RESULT_DECL:
4328 op0 = DECL_RTL_IF_SET (exp);
4330 /* This decl was probably optimized away. */
4331 if (!op0)
4333 if (!VAR_P (exp)
4334 || DECL_EXTERNAL (exp)
4335 || !TREE_STATIC (exp)
4336 || !DECL_NAME (exp)
4337 || DECL_HARD_REGISTER (exp)
4338 || DECL_IN_CONSTANT_POOL (exp)
4339 || mode == VOIDmode)
4340 return NULL;
4342 op0 = make_decl_rtl_for_debug (exp);
4343 if (!MEM_P (op0)
4344 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4345 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4346 return NULL;
4348 else
4349 op0 = copy_rtx (op0);
4351 if (GET_MODE (op0) == BLKmode
4352 /* If op0 is not BLKmode, but mode is, adjust_mode
4353 below would ICE. While it is likely a FE bug,
4354 try to be robust here. See PR43166. */
4355 || mode == BLKmode
4356 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4358 gcc_assert (MEM_P (op0));
4359 op0 = adjust_address_nv (op0, mode, 0);
4360 return op0;
4363 /* Fall through. */
4365 adjust_mode:
4366 case PAREN_EXPR:
4367 CASE_CONVERT:
4369 inner_mode = GET_MODE (op0);
4371 if (mode == inner_mode)
4372 return op0;
4374 if (inner_mode == VOIDmode)
4376 if (TREE_CODE (exp) == SSA_NAME)
4377 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4378 else
4379 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4380 if (mode == inner_mode)
4381 return op0;
4384 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4386 if (GET_MODE_UNIT_BITSIZE (mode)
4387 == GET_MODE_UNIT_BITSIZE (inner_mode))
4388 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4389 else if (GET_MODE_UNIT_BITSIZE (mode)
4390 < GET_MODE_UNIT_BITSIZE (inner_mode))
4391 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4392 else
4393 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4395 else if (FLOAT_MODE_P (mode))
4397 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4398 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4399 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4400 else
4401 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4403 else if (FLOAT_MODE_P (inner_mode))
4405 if (unsignedp)
4406 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4407 else
4408 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4410 else if (GET_MODE_UNIT_PRECISION (mode)
4411 == GET_MODE_UNIT_PRECISION (inner_mode))
4412 op0 = lowpart_subreg (mode, op0, inner_mode);
4413 else if (GET_MODE_UNIT_PRECISION (mode)
4414 < GET_MODE_UNIT_PRECISION (inner_mode))
4415 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4416 else if (UNARY_CLASS_P (exp)
4417 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4418 : unsignedp)
4419 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4420 else
4421 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4423 return op0;
4426 case MEM_REF:
4427 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4429 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4430 TREE_OPERAND (exp, 0),
4431 TREE_OPERAND (exp, 1));
4432 if (newexp)
4433 return expand_debug_expr (newexp);
4435 /* FALLTHROUGH */
4436 case INDIRECT_REF:
4437 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4438 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4439 if (!op0)
4440 return NULL;
4442 if (TREE_CODE (exp) == MEM_REF)
4444 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4445 || (GET_CODE (op0) == PLUS
4446 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4447 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4448 Instead just use get_inner_reference. */
4449 goto component_ref;
4451 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4452 poly_int64 offset;
4453 if (!op1 || !poly_int_rtx_p (op1, &offset))
4454 return NULL;
4456 op0 = plus_constant (inner_mode, op0, offset);
4459 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4461 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4462 op0, as);
4463 if (op0 == NULL_RTX)
4464 return NULL;
4466 op0 = gen_rtx_MEM (mode, op0);
4467 set_mem_attributes (op0, exp, 0);
4468 if (TREE_CODE (exp) == MEM_REF
4469 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4470 set_mem_expr (op0, NULL_TREE);
4471 set_mem_addr_space (op0, as);
4473 return op0;
4475 case TARGET_MEM_REF:
4476 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4477 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4478 return NULL;
4480 op0 = expand_debug_expr
4481 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4482 if (!op0)
4483 return NULL;
4485 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4486 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4487 op0, as);
4488 if (op0 == NULL_RTX)
4489 return NULL;
4491 op0 = gen_rtx_MEM (mode, op0);
4493 set_mem_attributes (op0, exp, 0);
4494 set_mem_addr_space (op0, as);
4496 return op0;
4498 component_ref:
4499 case ARRAY_REF:
4500 case ARRAY_RANGE_REF:
4501 case COMPONENT_REF:
4502 case BIT_FIELD_REF:
4503 case REALPART_EXPR:
4504 case IMAGPART_EXPR:
4505 case VIEW_CONVERT_EXPR:
4507 machine_mode mode1;
4508 poly_int64 bitsize, bitpos;
4509 tree offset;
4510 int reversep, volatilep = 0;
4511 tree tem
4512 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4513 &unsignedp, &reversep, &volatilep);
4514 rtx orig_op0;
4516 if (known_eq (bitsize, 0))
4517 return NULL;
4519 orig_op0 = op0 = expand_debug_expr (tem);
4521 if (!op0)
4522 return NULL;
4524 if (offset)
4526 machine_mode addrmode, offmode;
4528 if (!MEM_P (op0))
4529 return NULL;
4531 op0 = XEXP (op0, 0);
4532 addrmode = GET_MODE (op0);
4533 if (addrmode == VOIDmode)
4534 addrmode = Pmode;
4536 op1 = expand_debug_expr (offset);
4537 if (!op1)
4538 return NULL;
4540 offmode = GET_MODE (op1);
4541 if (offmode == VOIDmode)
4542 offmode = TYPE_MODE (TREE_TYPE (offset));
4544 if (addrmode != offmode)
4545 op1 = lowpart_subreg (addrmode, op1, offmode);
4547 /* Don't use offset_address here, we don't need a
4548 recognizable address, and we don't want to generate
4549 code. */
4550 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4551 op0, op1));
4554 if (MEM_P (op0))
4556 if (mode1 == VOIDmode)
4558 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4559 return NULL;
4560 /* Bitfield. */
4561 mode1 = smallest_int_mode_for_size (bitsize);
4563 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4564 if (maybe_ne (bytepos, 0))
4566 op0 = adjust_address_nv (op0, mode1, bytepos);
4567 bitpos = num_trailing_bits (bitpos);
4569 else if (known_eq (bitpos, 0)
4570 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4571 op0 = adjust_address_nv (op0, mode, 0);
4572 else if (GET_MODE (op0) != mode1)
4573 op0 = adjust_address_nv (op0, mode1, 0);
4574 else
4575 op0 = copy_rtx (op0);
4576 if (op0 == orig_op0)
4577 op0 = shallow_copy_rtx (op0);
4578 set_mem_attributes (op0, exp, 0);
4581 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4582 return op0;
4584 if (maybe_lt (bitpos, 0))
4585 return NULL;
4587 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4588 return NULL;
4590 poly_int64 bytepos;
4591 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4592 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4594 machine_mode opmode = GET_MODE (op0);
4596 if (opmode == VOIDmode)
4597 opmode = TYPE_MODE (TREE_TYPE (tem));
4599 /* This condition may hold if we're expanding the address
4600 right past the end of an array that turned out not to
4601 be addressable (i.e., the address was only computed in
4602 debug stmts). The gen_subreg below would rightfully
4603 crash, and the address doesn't really exist, so just
4604 drop it. */
4605 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4606 return NULL;
4608 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4609 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4612 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4613 && TYPE_UNSIGNED (TREE_TYPE (exp))
4614 ? SIGN_EXTRACT
4615 : ZERO_EXTRACT, mode,
4616 GET_MODE (op0) != VOIDmode
4617 ? GET_MODE (op0)
4618 : TYPE_MODE (TREE_TYPE (tem)),
4619 op0, gen_int_mode (bitsize, word_mode),
4620 gen_int_mode (bitpos, word_mode));
4623 case ABS_EXPR:
4624 case ABSU_EXPR:
4625 return simplify_gen_unary (ABS, mode, op0, mode);
4627 case NEGATE_EXPR:
4628 return simplify_gen_unary (NEG, mode, op0, mode);
4630 case BIT_NOT_EXPR:
4631 return simplify_gen_unary (NOT, mode, op0, mode);
4633 case FLOAT_EXPR:
4634 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4635 0)))
4636 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4637 inner_mode);
4639 case FIX_TRUNC_EXPR:
4640 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4641 inner_mode);
4643 case POINTER_PLUS_EXPR:
4644 /* For the rare target where pointers are not the same size as
4645 size_t, we need to check for mis-matched modes and correct
4646 the addend. */
4647 if (op0 && op1
4648 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4649 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4650 && op0_mode != op1_mode)
4652 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4653 /* If OP0 is a partial mode, then we must truncate, even
4654 if it has the same bitsize as OP1 as GCC's
4655 representation of partial modes is opaque. */
4656 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4657 && (GET_MODE_BITSIZE (op0_mode)
4658 == GET_MODE_BITSIZE (op1_mode))))
4659 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4660 else
4661 /* We always sign-extend, regardless of the signedness of
4662 the operand, because the operand is always unsigned
4663 here even if the original C expression is signed. */
4664 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4666 /* Fall through. */
4667 case PLUS_EXPR:
4668 return simplify_gen_binary (PLUS, mode, op0, op1);
4670 case MINUS_EXPR:
4671 case POINTER_DIFF_EXPR:
4672 return simplify_gen_binary (MINUS, mode, op0, op1);
4674 case MULT_EXPR:
4675 return simplify_gen_binary (MULT, mode, op0, op1);
4677 case RDIV_EXPR:
4678 case TRUNC_DIV_EXPR:
4679 case EXACT_DIV_EXPR:
4680 if (unsignedp)
4681 return simplify_gen_binary (UDIV, mode, op0, op1);
4682 else
4683 return simplify_gen_binary (DIV, mode, op0, op1);
4685 case TRUNC_MOD_EXPR:
4686 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4688 case FLOOR_DIV_EXPR:
4689 if (unsignedp)
4690 return simplify_gen_binary (UDIV, mode, op0, op1);
4691 else
4693 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4694 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4695 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4696 return simplify_gen_binary (PLUS, mode, div, adj);
4699 case FLOOR_MOD_EXPR:
4700 if (unsignedp)
4701 return simplify_gen_binary (UMOD, mode, op0, op1);
4702 else
4704 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4705 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4706 adj = simplify_gen_unary (NEG, mode,
4707 simplify_gen_binary (MULT, mode, adj, op1),
4708 mode);
4709 return simplify_gen_binary (PLUS, mode, mod, adj);
4712 case CEIL_DIV_EXPR:
4713 if (unsignedp)
4715 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4716 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4717 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4718 return simplify_gen_binary (PLUS, mode, div, adj);
4720 else
4722 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4723 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4724 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4725 return simplify_gen_binary (PLUS, mode, div, adj);
4728 case CEIL_MOD_EXPR:
4729 if (unsignedp)
4731 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4732 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4733 adj = simplify_gen_unary (NEG, mode,
4734 simplify_gen_binary (MULT, mode, adj, op1),
4735 mode);
4736 return simplify_gen_binary (PLUS, mode, mod, adj);
4738 else
4740 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4741 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4742 adj = simplify_gen_unary (NEG, mode,
4743 simplify_gen_binary (MULT, mode, adj, op1),
4744 mode);
4745 return simplify_gen_binary (PLUS, mode, mod, adj);
4748 case ROUND_DIV_EXPR:
4749 if (unsignedp)
4751 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4752 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4753 rtx adj = round_udiv_adjust (mode, mod, op1);
4754 return simplify_gen_binary (PLUS, mode, div, adj);
4756 else
4758 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4759 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4760 rtx adj = round_sdiv_adjust (mode, mod, op1);
4761 return simplify_gen_binary (PLUS, mode, div, adj);
4764 case ROUND_MOD_EXPR:
4765 if (unsignedp)
4767 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4768 rtx adj = round_udiv_adjust (mode, mod, op1);
4769 adj = simplify_gen_unary (NEG, mode,
4770 simplify_gen_binary (MULT, mode, adj, op1),
4771 mode);
4772 return simplify_gen_binary (PLUS, mode, mod, adj);
4774 else
4776 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4777 rtx adj = round_sdiv_adjust (mode, mod, op1);
4778 adj = simplify_gen_unary (NEG, mode,
4779 simplify_gen_binary (MULT, mode, adj, op1),
4780 mode);
4781 return simplify_gen_binary (PLUS, mode, mod, adj);
4784 case LSHIFT_EXPR:
4785 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4787 case RSHIFT_EXPR:
4788 if (unsignedp)
4789 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4790 else
4791 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4793 case LROTATE_EXPR:
4794 return simplify_gen_binary (ROTATE, mode, op0, op1);
4796 case RROTATE_EXPR:
4797 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4799 case MIN_EXPR:
4800 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4802 case MAX_EXPR:
4803 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4805 case BIT_AND_EXPR:
4806 case TRUTH_AND_EXPR:
4807 return simplify_gen_binary (AND, mode, op0, op1);
4809 case BIT_IOR_EXPR:
4810 case TRUTH_OR_EXPR:
4811 return simplify_gen_binary (IOR, mode, op0, op1);
4813 case BIT_XOR_EXPR:
4814 case TRUTH_XOR_EXPR:
4815 return simplify_gen_binary (XOR, mode, op0, op1);
4817 case TRUTH_ANDIF_EXPR:
4818 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4820 case TRUTH_ORIF_EXPR:
4821 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4823 case TRUTH_NOT_EXPR:
4824 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4826 case LT_EXPR:
4827 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4828 op0, op1);
4830 case LE_EXPR:
4831 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4832 op0, op1);
4834 case GT_EXPR:
4835 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4836 op0, op1);
4838 case GE_EXPR:
4839 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4840 op0, op1);
4842 case EQ_EXPR:
4843 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4845 case NE_EXPR:
4846 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4848 case UNORDERED_EXPR:
4849 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4851 case ORDERED_EXPR:
4852 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4854 case UNLT_EXPR:
4855 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4857 case UNLE_EXPR:
4858 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4860 case UNGT_EXPR:
4861 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4863 case UNGE_EXPR:
4864 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4866 case UNEQ_EXPR:
4867 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4869 case LTGT_EXPR:
4870 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4872 case COND_EXPR:
4873 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4875 case COMPLEX_EXPR:
4876 gcc_assert (COMPLEX_MODE_P (mode));
4877 if (GET_MODE (op0) == VOIDmode)
4878 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4879 if (GET_MODE (op1) == VOIDmode)
4880 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4881 return gen_rtx_CONCAT (mode, op0, op1);
4883 case CONJ_EXPR:
4884 if (GET_CODE (op0) == CONCAT)
4885 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4886 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4887 XEXP (op0, 1),
4888 GET_MODE_INNER (mode)));
4889 else
4891 scalar_mode imode = GET_MODE_INNER (mode);
4892 rtx re, im;
4894 if (MEM_P (op0))
4896 re = adjust_address_nv (op0, imode, 0);
4897 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4899 else
4901 scalar_int_mode ifmode;
4902 scalar_int_mode ihmode;
4903 rtx halfsize;
4904 if (!int_mode_for_mode (mode).exists (&ifmode)
4905 || !int_mode_for_mode (imode).exists (&ihmode))
4906 return NULL;
4907 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4908 re = op0;
4909 if (mode != ifmode)
4910 re = gen_rtx_SUBREG (ifmode, re, 0);
4911 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4912 if (imode != ihmode)
4913 re = gen_rtx_SUBREG (imode, re, 0);
4914 im = copy_rtx (op0);
4915 if (mode != ifmode)
4916 im = gen_rtx_SUBREG (ifmode, im, 0);
4917 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4918 if (imode != ihmode)
4919 im = gen_rtx_SUBREG (imode, im, 0);
4921 im = gen_rtx_NEG (imode, im);
4922 return gen_rtx_CONCAT (mode, re, im);
4925 case ADDR_EXPR:
4926 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4927 if (!op0 || !MEM_P (op0))
4929 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4930 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4931 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4932 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4933 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4934 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4936 if (handled_component_p (TREE_OPERAND (exp, 0)))
4938 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
4939 bool reverse;
4940 tree decl
4941 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
4942 &bitsize, &maxsize, &reverse);
4943 if ((VAR_P (decl)
4944 || TREE_CODE (decl) == PARM_DECL
4945 || TREE_CODE (decl) == RESULT_DECL)
4946 && (!TREE_ADDRESSABLE (decl)
4947 || target_for_debug_bind (decl))
4948 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
4949 && known_gt (bitsize, 0)
4950 && known_eq (bitsize, maxsize))
4952 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4953 return plus_constant (mode, base, byteoffset);
4957 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4958 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4959 == ADDR_EXPR)
4961 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4962 0));
4963 if (op0 != NULL
4964 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4965 || (GET_CODE (op0) == PLUS
4966 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4967 && CONST_INT_P (XEXP (op0, 1)))))
4969 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4970 1));
4971 poly_int64 offset;
4972 if (!op1 || !poly_int_rtx_p (op1, &offset))
4973 return NULL;
4975 return plus_constant (mode, op0, offset);
4979 return NULL;
4982 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4983 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
4984 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
4986 return op0;
4988 case VECTOR_CST:
4990 unsigned HOST_WIDE_INT i, nelts;
4992 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
4993 return NULL;
4995 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
4997 for (i = 0; i < nelts; ++i)
4999 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5000 if (!op1)
5001 return NULL;
5002 XVECEXP (op0, 0, i) = op1;
5005 return op0;
5008 case CONSTRUCTOR:
5009 if (TREE_CLOBBER_P (exp))
5010 return NULL;
5011 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5013 unsigned i;
5014 unsigned HOST_WIDE_INT nelts;
5015 tree val;
5017 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5018 goto flag_unsupported;
5020 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5022 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5024 op1 = expand_debug_expr (val);
5025 if (!op1)
5026 return NULL;
5027 XVECEXP (op0, 0, i) = op1;
5030 if (i < nelts)
5032 op1 = expand_debug_expr
5033 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5035 if (!op1)
5036 return NULL;
5038 for (; i < nelts; i++)
5039 XVECEXP (op0, 0, i) = op1;
5042 return op0;
5044 else
5045 goto flag_unsupported;
5047 case CALL_EXPR:
5048 /* ??? Maybe handle some builtins? */
5049 return NULL;
5051 case SSA_NAME:
5053 gimple *g = get_gimple_for_ssa_name (exp);
5054 if (g)
5056 tree t = NULL_TREE;
5057 if (deep_ter_debug_map)
5059 tree *slot = deep_ter_debug_map->get (exp);
5060 if (slot)
5061 t = *slot;
5063 if (t == NULL_TREE)
5064 t = gimple_assign_rhs_to_tree (g);
5065 op0 = expand_debug_expr (t);
5066 if (!op0)
5067 return NULL;
5069 else
5071 /* If this is a reference to an incoming value of
5072 parameter that is never used in the code or where the
5073 incoming value is never used in the code, use
5074 PARM_DECL's DECL_RTL if set. */
5075 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5076 && SSA_NAME_VAR (exp)
5077 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5078 && has_zero_uses (exp))
5080 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5081 if (op0)
5082 goto adjust_mode;
5083 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5084 if (op0)
5085 goto adjust_mode;
5088 int part = var_to_partition (SA.map, exp);
5090 if (part == NO_PARTITION)
5091 return NULL;
5093 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5095 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5097 goto adjust_mode;
5100 case ERROR_MARK:
5101 return NULL;
5103 /* Vector stuff. For most of the codes we don't have rtl codes. */
5104 case REALIGN_LOAD_EXPR:
5105 case VEC_COND_EXPR:
5106 case VEC_PACK_FIX_TRUNC_EXPR:
5107 case VEC_PACK_FLOAT_EXPR:
5108 case VEC_PACK_SAT_EXPR:
5109 case VEC_PACK_TRUNC_EXPR:
5110 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5111 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5112 case VEC_UNPACK_FLOAT_HI_EXPR:
5113 case VEC_UNPACK_FLOAT_LO_EXPR:
5114 case VEC_UNPACK_HI_EXPR:
5115 case VEC_UNPACK_LO_EXPR:
5116 case VEC_WIDEN_MULT_HI_EXPR:
5117 case VEC_WIDEN_MULT_LO_EXPR:
5118 case VEC_WIDEN_MULT_EVEN_EXPR:
5119 case VEC_WIDEN_MULT_ODD_EXPR:
5120 case VEC_WIDEN_LSHIFT_HI_EXPR:
5121 case VEC_WIDEN_LSHIFT_LO_EXPR:
5122 case VEC_PERM_EXPR:
5123 case VEC_DUPLICATE_EXPR:
5124 case VEC_SERIES_EXPR:
5125 return NULL;
5127 /* Misc codes. */
5128 case ADDR_SPACE_CONVERT_EXPR:
5129 case FIXED_CONVERT_EXPR:
5130 case OBJ_TYPE_REF:
5131 case WITH_SIZE_EXPR:
5132 case BIT_INSERT_EXPR:
5133 return NULL;
5135 case DOT_PROD_EXPR:
5136 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5137 && SCALAR_INT_MODE_P (mode))
5140 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5141 0)))
5142 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5143 inner_mode);
5145 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5146 1)))
5147 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5148 inner_mode);
5149 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5150 return simplify_gen_binary (PLUS, mode, op0, op2);
5152 return NULL;
5154 case WIDEN_MULT_EXPR:
5155 case WIDEN_MULT_PLUS_EXPR:
5156 case WIDEN_MULT_MINUS_EXPR:
5157 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5158 && SCALAR_INT_MODE_P (mode))
5160 inner_mode = GET_MODE (op0);
5161 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5162 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5163 else
5164 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5165 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5166 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5167 else
5168 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5169 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5170 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5171 return op0;
5172 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5173 return simplify_gen_binary (PLUS, mode, op0, op2);
5174 else
5175 return simplify_gen_binary (MINUS, mode, op2, op0);
5177 return NULL;
5179 case MULT_HIGHPART_EXPR:
5180 /* ??? Similar to the above. */
5181 return NULL;
5183 case WIDEN_SUM_EXPR:
5184 case WIDEN_LSHIFT_EXPR:
5185 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5186 && SCALAR_INT_MODE_P (mode))
5189 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5190 0)))
5191 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5192 inner_mode);
5193 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5194 ? ASHIFT : PLUS, mode, op0, op1);
5196 return NULL;
5198 default:
5199 flag_unsupported:
5200 if (flag_checking)
5202 debug_tree (exp);
5203 gcc_unreachable ();
5205 return NULL;
5209 /* Return an RTX equivalent to the source bind value of the tree expression
5210 EXP. */
5212 static rtx
5213 expand_debug_source_expr (tree exp)
5215 rtx op0 = NULL_RTX;
5216 machine_mode mode = VOIDmode, inner_mode;
5218 switch (TREE_CODE (exp))
5220 case VAR_DECL:
5221 if (DECL_ABSTRACT_ORIGIN (exp))
5222 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5223 break;
5224 case PARM_DECL:
5226 mode = DECL_MODE (exp);
5227 op0 = expand_debug_parm_decl (exp);
5228 if (op0)
5229 break;
5230 /* See if this isn't an argument that has been completely
5231 optimized out. */
5232 if (!DECL_RTL_SET_P (exp)
5233 && !DECL_INCOMING_RTL (exp)
5234 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5236 tree aexp = DECL_ORIGIN (exp);
5237 if (DECL_CONTEXT (aexp)
5238 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5240 vec<tree, va_gc> **debug_args;
5241 unsigned int ix;
5242 tree ddecl;
5243 debug_args = decl_debug_args_lookup (current_function_decl);
5244 if (debug_args != NULL)
5246 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5247 ix += 2)
5248 if (ddecl == aexp)
5249 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5253 break;
5255 default:
5256 break;
5259 if (op0 == NULL_RTX)
5260 return NULL_RTX;
5262 inner_mode = GET_MODE (op0);
5263 if (mode == inner_mode)
5264 return op0;
5266 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5268 if (GET_MODE_UNIT_BITSIZE (mode)
5269 == GET_MODE_UNIT_BITSIZE (inner_mode))
5270 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5271 else if (GET_MODE_UNIT_BITSIZE (mode)
5272 < GET_MODE_UNIT_BITSIZE (inner_mode))
5273 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5274 else
5275 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5277 else if (FLOAT_MODE_P (mode))
5278 gcc_unreachable ();
5279 else if (FLOAT_MODE_P (inner_mode))
5281 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5282 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5283 else
5284 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5286 else if (GET_MODE_UNIT_PRECISION (mode)
5287 == GET_MODE_UNIT_PRECISION (inner_mode))
5288 op0 = lowpart_subreg (mode, op0, inner_mode);
5289 else if (GET_MODE_UNIT_PRECISION (mode)
5290 < GET_MODE_UNIT_PRECISION (inner_mode))
5291 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5292 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5293 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5294 else
5295 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5297 return op0;
5300 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5301 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5302 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5304 static void
5305 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5307 rtx exp = *exp_p;
5309 if (exp == NULL_RTX)
5310 return;
5312 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5313 return;
5315 if (depth == 4)
5317 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5318 rtx dval = make_debug_expr_from_rtl (exp);
5320 /* Emit a debug bind insn before INSN. */
5321 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5322 DEBUG_EXPR_TREE_DECL (dval), exp,
5323 VAR_INIT_STATUS_INITIALIZED);
5325 emit_debug_insn_before (bind, insn);
5326 *exp_p = dval;
5327 return;
5330 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5331 int i, j;
5332 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5333 switch (*format_ptr++)
5335 case 'e':
5336 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5337 break;
5339 case 'E':
5340 case 'V':
5341 for (j = 0; j < XVECLEN (exp, i); j++)
5342 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5343 break;
5345 default:
5346 break;
5350 /* Expand the _LOCs in debug insns. We run this after expanding all
5351 regular insns, so that any variables referenced in the function
5352 will have their DECL_RTLs set. */
5354 static void
5355 expand_debug_locations (void)
5357 rtx_insn *insn;
5358 rtx_insn *last = get_last_insn ();
5359 int save_strict_alias = flag_strict_aliasing;
5361 /* New alias sets while setting up memory attributes cause
5362 -fcompare-debug failures, even though it doesn't bring about any
5363 codegen changes. */
5364 flag_strict_aliasing = 0;
5366 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5367 if (DEBUG_BIND_INSN_P (insn))
5369 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5370 rtx val;
5371 rtx_insn *prev_insn, *insn2;
5372 machine_mode mode;
5374 if (value == NULL_TREE)
5375 val = NULL_RTX;
5376 else
5378 if (INSN_VAR_LOCATION_STATUS (insn)
5379 == VAR_INIT_STATUS_UNINITIALIZED)
5380 val = expand_debug_source_expr (value);
5381 /* The avoid_deep_ter_for_debug function inserts
5382 debug bind stmts after SSA_NAME definition, with the
5383 SSA_NAME as the whole bind location. Disable temporarily
5384 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5385 being defined in this DEBUG_INSN. */
5386 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5388 tree *slot = deep_ter_debug_map->get (value);
5389 if (slot)
5391 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5392 *slot = NULL_TREE;
5393 else
5394 slot = NULL;
5396 val = expand_debug_expr (value);
5397 if (slot)
5398 *slot = INSN_VAR_LOCATION_DECL (insn);
5400 else
5401 val = expand_debug_expr (value);
5402 gcc_assert (last == get_last_insn ());
5405 if (!val)
5406 val = gen_rtx_UNKNOWN_VAR_LOC ();
5407 else
5409 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5411 gcc_assert (mode == GET_MODE (val)
5412 || (GET_MODE (val) == VOIDmode
5413 && (CONST_SCALAR_INT_P (val)
5414 || GET_CODE (val) == CONST_FIXED
5415 || GET_CODE (val) == LABEL_REF)));
5418 INSN_VAR_LOCATION_LOC (insn) = val;
5419 prev_insn = PREV_INSN (insn);
5420 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5421 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5424 flag_strict_aliasing = save_strict_alias;
5427 /* Performs swapping operands of commutative operations to expand
5428 the expensive one first. */
5430 static void
5431 reorder_operands (basic_block bb)
5433 unsigned int *lattice; /* Hold cost of each statement. */
5434 unsigned int i = 0, n = 0;
5435 gimple_stmt_iterator gsi;
5436 gimple_seq stmts;
5437 gimple *stmt;
5438 bool swap;
5439 tree op0, op1;
5440 ssa_op_iter iter;
5441 use_operand_p use_p;
5442 gimple *def0, *def1;
5444 /* Compute cost of each statement using estimate_num_insns. */
5445 stmts = bb_seq (bb);
5446 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5448 stmt = gsi_stmt (gsi);
5449 if (!is_gimple_debug (stmt))
5450 gimple_set_uid (stmt, n++);
5452 lattice = XNEWVEC (unsigned int, n);
5453 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5455 unsigned cost;
5456 stmt = gsi_stmt (gsi);
5457 if (is_gimple_debug (stmt))
5458 continue;
5459 cost = estimate_num_insns (stmt, &eni_size_weights);
5460 lattice[i] = cost;
5461 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5463 tree use = USE_FROM_PTR (use_p);
5464 gimple *def_stmt;
5465 if (TREE_CODE (use) != SSA_NAME)
5466 continue;
5467 def_stmt = get_gimple_for_ssa_name (use);
5468 if (!def_stmt)
5469 continue;
5470 lattice[i] += lattice[gimple_uid (def_stmt)];
5472 i++;
5473 if (!is_gimple_assign (stmt)
5474 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5475 continue;
5476 op0 = gimple_op (stmt, 1);
5477 op1 = gimple_op (stmt, 2);
5478 if (TREE_CODE (op0) != SSA_NAME
5479 || TREE_CODE (op1) != SSA_NAME)
5480 continue;
5481 /* Swap operands if the second one is more expensive. */
5482 def0 = get_gimple_for_ssa_name (op0);
5483 def1 = get_gimple_for_ssa_name (op1);
5484 if (!def1)
5485 continue;
5486 swap = false;
5487 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5488 swap = true;
5489 if (swap)
5491 if (dump_file && (dump_flags & TDF_DETAILS))
5493 fprintf (dump_file, "Swap operands in stmt:\n");
5494 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5495 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5496 def0 ? lattice[gimple_uid (def0)] : 0,
5497 lattice[gimple_uid (def1)]);
5499 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5500 gimple_assign_rhs2_ptr (stmt));
5503 XDELETE (lattice);
5506 /* Expand basic block BB from GIMPLE trees to RTL.

   When DISABLE_TAIL_CALLS is true, the tail-call flag is cleared on
   every call statement before it is expanded, so such calls take the
   ordinary statement path.

   Returns the block in which expansion ended: the block handed back by
   expand_gimple_cond, or by expand_gimple_tailcall when the call cannot
   fall through, if either returns a non-null block; otherwise BB
   itself (which is replaced by the tail call's block when that call
   can fall through). */
5508 static basic_block
5509 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5511 gimple_stmt_iterator gsi;
5512 gimple_seq stmts;
5513 gimple *stmt = NULL;
5514 rtx_note *note = NULL;
5515 rtx_insn *last;
5516 edge e;
5517 edge_iterator ei;
5519 if (dump_file)
5520 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5521 bb->index);
5523 /* Note that since we are now transitioning from GIMPLE to RTL, we
5524 cannot use the gsi_*_bb() routines because they expect the basic
5525 block to be in GIMPLE, instead of RTL. Therefore, we need to
5526 access the BB sequence directly. */
5527 if (optimize)
5528 reorder_operands (bb);
/* Detach the GIMPLE sequence and PHI nodes from BB and flag it as an
   RTL block; the statements are walked through STMTS from here on. */
5529 stmts = bb_seq (bb);
5530 bb->il.gimple.seq = NULL;
5531 bb->il.gimple.phi_nodes = NULL;
5532 rtl_profile_for_bb (bb);
5533 init_rtl_bb_info (bb);
5534 bb->flags |= BB_RTL;
5536 /* Remove the RETURN_EXPR if we may fall through to the exit
5537 instead. */
5538 gsi = gsi_last (stmts);
5539 if (!gsi_end_p (gsi)
5540 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5542 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5544 gcc_assert (single_succ_p (bb));
5545 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5547 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5548 && !gimple_return_retval (ret_stmt))
5550 gsi_remove (&gsi, false);
5551 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
/* Keep the first statement in STMT only if it is a GIMPLE_LABEL; it is
   expanded ahead of the main statement loop below. */
5555 gsi = gsi_start (stmts);
5556 if (!gsi_end_p (gsi))
5558 stmt = gsi_stmt (gsi);
5559 if (gimple_code (stmt) != GIMPLE_LABEL)
5560 stmt = NULL;
5563 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
/* The block starts with a code label when it begins with a GIMPLE label
   or when lab_rtx_for_bb already holds a label for it; otherwise it
   starts directly with the basic-block note. */
5565 if (stmt || elt)
5567 gcc_checking_assert (!note);
5568 last = get_last_insn ();
5570 if (stmt)
5572 expand_gimple_stmt (stmt);
5573 gsi_next (&gsi);
5576 if (elt)
5577 emit_label (*elt);
5579 BB_HEAD (bb) = NEXT_INSN (last);
5580 if (NOTE_P (BB_HEAD (bb)))
5581 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5582 gcc_assert (LABEL_P (BB_HEAD (bb)));
5583 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5585 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5587 else
5588 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5590 if (note)
5591 NOTE_BASIC_BLOCK (note) = bb;
5593 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5595 basic_block new_bb;
5597 stmt = gsi_stmt (gsi);
5599 /* If this statement is a non-debug one, and we generate debug
5600 insns, then this one might be the last real use of a TERed
5601 SSA_NAME, but where there are still some debug uses further
5602 down. Expanding the current SSA name in such further debug
5603 uses by their RHS might lead to wrong debug info, as coalescing
5604 might make the operands of such RHS be placed into the same
5605 pseudo as something else. Like so:
5606 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5607 use(a_1);
5608 a_2 = ...
5609 #DEBUG ... => a_1
5610 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5611 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5612 the write to a_2 would actually have clobbered the place which
5613 formerly held a_0.
5615 So, instead of that, we recognize the situation, and generate
5616 debug temporaries at the last real use of TERed SSA names:
5617 a_1 = a_0 + 1;
5618 #DEBUG #D1 => a_1
5619 use(a_1);
5620 a_2 = ...
5621 #DEBUG ... => #D1
5623 if (MAY_HAVE_DEBUG_BIND_INSNS
5624 && SA.values
5625 && !is_gimple_debug (stmt))
5627 ssa_op_iter iter;
5628 tree op;
5629 gimple *def;
5631 location_t sloc = curr_insn_location ();
5633 /* Look for SSA names that have their last use here (TERed
5634 names always have only one real use). */
5635 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5636 if ((def = get_gimple_for_ssa_name (op)))
5638 imm_use_iterator imm_iter;
5639 use_operand_p use_p;
5640 bool have_debug_uses = false;
5642 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5644 if (gimple_debug_bind_p (USE_STMT (use_p)))
5646 have_debug_uses = true;
5647 break;
5651 if (have_debug_uses)
5653 /* OP is a TERed SSA name, with DEF its defining
5654 statement, and where OP is used in further debug
5655 instructions. Generate a debug temporary, and
5656 replace all uses of OP in debug insns with that
5657 temporary. */
5658 gimple *debugstmt;
5659 tree value = gimple_assign_rhs_to_tree (def);
5660 tree vexpr = make_node (DEBUG_EXPR_DECL);
5661 rtx val;
5662 machine_mode mode;
5664 set_curr_insn_location (gimple_location (def));
5666 DECL_ARTIFICIAL (vexpr) = 1;
5667 TREE_TYPE (vexpr) = TREE_TYPE (value);
5668 if (DECL_P (value))
5669 mode = DECL_MODE (value);
5670 else
5671 mode = TYPE_MODE (TREE_TYPE (value));
5672 SET_DECL_MODE (vexpr, mode);
5674 val = gen_rtx_VAR_LOCATION
5675 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5677 emit_debug_insn (val);
5679 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5681 if (!gimple_debug_bind_p (debugstmt))
5682 continue;
5684 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5685 SET_USE (use_p, vexpr);
5687 update_stmt (debugstmt);
5691 set_curr_insn_location (sloc);
5694 currently_expanding_gimple_stmt = stmt;
5696 /* Expand this statement, then evaluate the resulting RTL and
5697 fixup the CFG accordingly. */
5698 if (gimple_code (stmt) == GIMPLE_COND)
5700 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5701 if (new_bb)
5702 return new_bb;
5704 else if (is_gimple_debug (stmt))
5706 location_t sloc = curr_insn_location ();
5707 gimple_stmt_iterator nsi = gsi;
/* Expand STMT and every debug statement that directly follows it.  NSI
   runs one statement ahead of GSI, so GSI is left on the last debug
   statement handled when the loop exits. */
5709 for (;;)
5711 tree var;
5712 tree value = NULL_TREE;
5713 rtx val = NULL_RTX;
5714 machine_mode mode;
5716 if (!gimple_debug_nonbind_marker_p (stmt))
5718 if (gimple_debug_bind_p (stmt))
5720 var = gimple_debug_bind_get_var (stmt);
5722 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5723 && TREE_CODE (var) != LABEL_DECL
5724 && !target_for_debug_bind (var))
5725 goto delink_debug_stmt;
5727 if (DECL_P (var))
5728 mode = DECL_MODE (var);
5729 else
5730 mode = TYPE_MODE (TREE_TYPE (var));
5732 if (gimple_debug_bind_has_value_p (stmt))
5733 value = gimple_debug_bind_get_value (stmt);
5735 val = gen_rtx_VAR_LOCATION
5736 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5738 else if (gimple_debug_source_bind_p (stmt))
5740 var = gimple_debug_source_bind_get_var (stmt);
5742 value = gimple_debug_source_bind_get_value (stmt);
5744 mode = DECL_MODE (var);
5746 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5747 VAR_INIT_STATUS_UNINITIALIZED);
5749 else
5750 gcc_unreachable ();
5752 /* If this function was first compiled with markers
5753 enabled, but they're now disabled (e.g. LTO), drop
5754 them on the floor. */
5755 else if (gimple_debug_nonbind_marker_p (stmt)
5756 && !MAY_HAVE_DEBUG_MARKER_INSNS)
5757 goto delink_debug_stmt;
5758 else if (gimple_debug_begin_stmt_p (stmt))
5759 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
5760 else if (gimple_debug_inline_entry_p (stmt))
5762 tree block = gimple_block (stmt);
5764 if (block)
5765 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
5766 else
5767 goto delink_debug_stmt;
5769 else
5770 gcc_unreachable ();
5772 last = get_last_insn ();
5774 set_curr_insn_location (gimple_location (stmt));
5776 emit_debug_insn (val);
5778 if (dump_file && (dump_flags & TDF_DETAILS))
5780 /* We can't dump the insn with a TREE where an RTX
5781 is expected. */
5782 if (GET_CODE (val) == VAR_LOCATION)
5784 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
5785 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5787 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5788 if (GET_CODE (val) == VAR_LOCATION)
5789 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5792 delink_debug_stmt:
5793 /* In order not to generate too many debug temporaries,
5794 we delink all uses of debug statements we already expanded.
5795 Therefore debug statements between definition and real
5796 use of TERed SSA names will continue to use the SSA name,
5797 and not be replaced with debug temps. */
5798 delink_stmt_imm_use (stmt);
5800 gsi = nsi;
5801 gsi_next (&nsi);
5802 if (gsi_end_p (nsi))
5803 break;
5804 stmt = gsi_stmt (nsi);
5805 if (!is_gimple_debug (stmt))
5806 break;
5809 set_curr_insn_location (sloc);
5811 else
/* Any other statement.  Calls still flagged as tail calls go through
   expand_gimple_tailcall; everything else is expanded as a plain
   statement unless its single SSA definition is marked in SA.values. */
5813 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5814 if (call_stmt
5815 && gimple_call_tail_p (call_stmt)
5816 && disable_tail_calls)
5817 gimple_call_set_tail (call_stmt, false);
5819 if (call_stmt && gimple_call_tail_p (call_stmt))
5821 bool can_fallthru;
5822 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5823 if (new_bb)
5825 if (can_fallthru)
5826 bb = new_bb;
5827 else
5828 return new_bb;
5831 else
5833 def_operand_p def_p;
5834 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5836 if (def_p != NULL)
5838 /* Ignore this stmt if it is in the list of
5839 replaceable expressions. */
5840 if (SA.values
5841 && bitmap_bit_p (SA.values,
5842 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5843 continue;
5845 last = expand_gimple_stmt (stmt);
5846 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5851 currently_expanding_gimple_stmt = NULL;
5853 /* Expand implicit goto and convert goto_locus. */
5854 FOR_EACH_EDGE (e, ei, bb->succs)
5856 if (e->goto_locus != UNKNOWN_LOCATION)
5857 set_curr_insn_location (e->goto_locus);
5858 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5860 emit_jump (label_rtx_for_bb (e->dest));
5861 e->flags &= ~EDGE_FALLTHRU;
5865 /* Expanded RTL can create a jump in the last instruction of block.
5866 This later might be assumed to be a jump to successor and break edge insertion.
5867 We need to insert dummy move to prevent this. PR41440. */
5868 if (single_succ_p (bb)
5869 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5870 && (last = get_last_insn ())
5871 && (JUMP_P (last)
5872 || (DEBUG_INSN_P (last)
5873 && JUMP_P (prev_nondebug_insn (last)))))
5875 rtx dummy = gen_reg_rtx (SImode);
5876 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5879 do_pending_stack_adjust ();
5881 /* Find the block tail. The last insn in the block is the insn
5882 before a barrier and/or table jump insn. */
5883 last = get_last_insn ();
5884 if (BARRIER_P (last))
5885 last = PREV_INSN (last);
5886 if (JUMP_TABLE_DATA_P (last))
5887 last = PREV_INSN (PREV_INSN (last));
5888 if (BARRIER_P (last))
5889 last = PREV_INSN (last);
5890 BB_END (bb) = last;
5892 update_bb_for_insn (bb);
5894 return bb;
5898 /* Create a basic block for initialization code. */
5900 static basic_block
5901 construct_init_block (void)
5903 basic_block init_block, first_block;
5904 edge e = NULL;
5905 int flags;
5907 /* Multiple entry points not supported yet. */
5908 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5909 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5910 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5911 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5912 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5914 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5916 /* When entry edge points to first basic block, we don't need jump,
5917 otherwise we have to jump into proper target. */
5918 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5920 tree label = gimple_block_label (e->dest);
5922 emit_jump (jump_target_rtx (label));
5923 flags = 0;
5925 else
5926 flags = EDGE_FALLTHRU;
5928 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5929 get_last_insn (),
5930 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5931 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5932 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5933 if (e)
5935 first_block = e->dest;
5936 redirect_edge_succ (e, init_block);
5937 e = make_single_succ_edge (init_block, first_block, flags);
5939 else
5940 e = make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5941 EDGE_FALLTHRU);
5943 update_bb_for_insn (init_block);
5944 return init_block;
5947 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5948 found in the block tree. */
5950 static void
5951 set_block_levels (tree block, int level)
5953 while (block)
5955 BLOCK_NUMBER (block) = level;
5956 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5957 block = BLOCK_CHAIN (block);
5961 /* Create a block containing landing pads and similar stuff. */
5963 static void
5964 construct_exit_block (void)
5966 rtx_insn *head = get_last_insn ();
5967 rtx_insn *end;
5968 basic_block exit_block;
5969 edge e, e2;
5970 unsigned ix;
5971 edge_iterator ei;
5972 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5973 rtx_insn *orig_end = BB_END (prev_bb);
5975 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5977 /* Make sure the locus is set to the end of the function, so that
5978 epilogue line numbers and warnings are set properly. */
5979 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5980 input_location = cfun->function_end_locus;
5982 /* Generate rtl for function exit. */
5983 expand_function_end ();
5985 end = get_last_insn ();
5986 if (head == end)
5987 return;
5988 /* While emitting the function end we could move end of the last basic
5989 block. */
5990 BB_END (prev_bb) = orig_end;
5991 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5992 head = NEXT_INSN (head);
5993 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5994 bb count counting will be confused. Any instructions before that
5995 label are emitted for the case where PREV_BB falls through into the
5996 exit block, so append those instructions to prev_bb in that case. */
5997 if (NEXT_INSN (head) != return_label)
5999 while (NEXT_INSN (head) != return_label)
6001 if (!NOTE_P (NEXT_INSN (head)))
6002 BB_END (prev_bb) = NEXT_INSN (head);
6003 head = NEXT_INSN (head);
6006 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6007 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6008 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6010 ix = 0;
6011 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6013 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6014 if (!(e->flags & EDGE_ABNORMAL))
6015 redirect_edge_succ (e, exit_block);
6016 else
6017 ix++;
6020 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6021 EDGE_FALLTHRU);
6022 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6023 if (e2 != e)
6025 exit_block->count -= e2->count ();
6027 update_bb_for_insn (exit_block);
6030 /* Helper function for discover_nonconstant_array_refs.
6031 Look for ARRAY_REF nodes with non-constant indexes and mark them
6032 addressable. */
6034 static tree
6035 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6036 void *data ATTRIBUTE_UNUSED)
6038 tree t = *tp;
6040 if (IS_TYPE_OR_DECL_P (t))
6041 *walk_subtrees = 0;
6042 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6044 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6045 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6046 && (!TREE_OPERAND (t, 2)
6047 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6048 || (TREE_CODE (t) == COMPONENT_REF
6049 && (!TREE_OPERAND (t,2)
6050 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6051 || TREE_CODE (t) == BIT_FIELD_REF
6052 || TREE_CODE (t) == REALPART_EXPR
6053 || TREE_CODE (t) == IMAGPART_EXPR
6054 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6055 || CONVERT_EXPR_P (t))
6056 t = TREE_OPERAND (t, 0);
6058 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6060 t = get_base_address (t);
6061 if (t && DECL_P (t)
6062 && DECL_MODE (t) != BLKmode)
6063 TREE_ADDRESSABLE (t) = 1;
6066 *walk_subtrees = 0;
6069 return NULL_TREE;
6072 /* RTL expansion is not able to compile array references with variable
6073 offsets for arrays stored in single register. Discover such
6074 expressions and mark variables as addressable to avoid this
6075 scenario. */
6077 static void
6078 discover_nonconstant_array_refs (void)
6080 basic_block bb;
6081 gimple_stmt_iterator gsi;
6083 FOR_EACH_BB_FN (bb, cfun)
6084 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6086 gimple *stmt = gsi_stmt (gsi);
6087 if (!is_gimple_debug (stmt))
6088 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
6092 /* This function sets crtl->args.internal_arg_pointer to a virtual
6093 register if DRAP is needed. Local register allocator will replace
6094 virtual_incoming_args_rtx with the virtual register. */
6096 static void
6097 expand_stack_alignment (void)
6099 rtx drap_rtx;
6100 unsigned int preferred_stack_boundary;
6102 if (! SUPPORTS_STACK_ALIGNMENT)
6103 return;
6105 if (cfun->calls_alloca
6106 || cfun->has_nonlocal_label
6107 || crtl->has_nonlocal_goto)
6108 crtl->need_drap = true;
6110 /* Call update_stack_boundary here again to update incoming stack
6111 boundary. It may set incoming stack alignment to a different
6112 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6113 use the minimum incoming stack alignment to check if it is OK
6114 to perform sibcall optimization since sibcall optimization will
6115 only align the outgoing stack to incoming stack boundary. */
6116 if (targetm.calls.update_stack_boundary)
6117 targetm.calls.update_stack_boundary ();
6119 /* The incoming stack frame has to be aligned at least at
6120 parm_stack_boundary. */
6121 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6123 /* Update crtl->stack_alignment_estimated and use it later to align
6124 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6125 exceptions since callgraph doesn't collect incoming stack alignment
6126 in this case. */
6127 if (cfun->can_throw_non_call_exceptions
6128 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6129 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6130 else
6131 preferred_stack_boundary = crtl->preferred_stack_boundary;
6132 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6133 crtl->stack_alignment_estimated = preferred_stack_boundary;
6134 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6135 crtl->stack_alignment_needed = preferred_stack_boundary;
6137 gcc_assert (crtl->stack_alignment_needed
6138 <= crtl->stack_alignment_estimated);
6140 crtl->stack_realign_needed
6141 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6142 crtl->stack_realign_tried = crtl->stack_realign_needed;
6144 crtl->stack_realign_processed = true;
6146 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6147 alignment. */
6148 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6149 drap_rtx = targetm.calls.get_drap_rtx ();
6151 /* stack_realign_drap and drap_rtx must match. */
6152 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6154 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6155 if (drap_rtx != NULL)
6157 crtl->args.internal_arg_pointer = drap_rtx;
6159 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6160 needed. */
6161 fixup_tail_calls ();
6166 static void
6167 expand_main_function (void)
6169 #if (defined(INVOKE__main) \
6170 || (!defined(HAS_INIT_SECTION) \
6171 && !defined(INIT_SECTION_ASM_OP) \
6172 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6173 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6174 #endif
6178 /* Expand code to initialize the stack_protect_guard. This is invoked at
6179 the beginning of a function to be protected. */
6181 static void
6182 stack_protect_prologue (void)
6184 tree guard_decl = targetm.stack_protect_guard ();
6185 rtx x, y;
6187 x = expand_normal (crtl->stack_protect_guard);
6188 if (guard_decl)
6189 y = expand_normal (guard_decl);
6190 else
6191 y = const0_rtx;
6193 /* Allow the target to copy from Y to X without leaking Y into a
6194 register. */
6195 if (targetm.have_stack_protect_set ())
6196 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6198 emit_insn (insn);
6199 return;
6202 /* Otherwise do a straight move. */
6203 emit_move_insn (x, y);
6206 /* Translate the intermediate representation contained in the CFG
6207 from GIMPLE trees to RTL.
6209 We do conversion per basic block and preserve/update the tree CFG.
6210 This implies we have to do some magic as the CFG can simultaneously
6211 consist of basic blocks containing RTL and GIMPLE trees. This can
6212 confuse the CFG hooks, so be careful to not manipulate CFG during
6213 the expansion. */
6215 namespace {
6217 const pass_data pass_data_expand =
6219 RTL_PASS, /* type */
6220 "expand", /* name */
6221 OPTGROUP_NONE, /* optinfo_flags */
6222 TV_EXPAND, /* tv_id */
6223 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6224 | PROP_gimple_lcx
6225 | PROP_gimple_lvec
6226 | PROP_gimple_lva), /* properties_required */
6227 PROP_rtl, /* properties_provided */
6228 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6229 0, /* todo_flags_start */
6230 0, /* todo_flags_finish */
6233 class pass_expand : public rtl_opt_pass
6235 public:
6236 pass_expand (gcc::context *ctxt)
6237 : rtl_opt_pass (pass_data_expand, ctxt)
6240 /* opt_pass methods: */
6241 virtual unsigned int execute (function *);
6243 }; // class pass_expand
6245 unsigned int
6246 pass_expand::execute (function *fun)
6248 basic_block bb, init_block;
6249 edge_iterator ei;
6250 edge e;
6251 rtx_insn *var_seq, *var_ret_seq;
6252 unsigned i;
6254 timevar_push (TV_OUT_OF_SSA);
6255 rewrite_out_of_ssa (&SA);
6256 timevar_pop (TV_OUT_OF_SSA);
6257 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6259 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6261 gimple_stmt_iterator gsi;
6262 FOR_EACH_BB_FN (bb, cfun)
6263 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6264 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6265 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6268 /* Make sure all values used by the optimization passes have sane
6269 defaults. */
6270 reg_renumber = 0;
6272 /* Some backends want to know that we are expanding to RTL. */
6273 currently_expanding_to_rtl = 1;
6274 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6275 free_dominance_info (CDI_DOMINATORS);
6277 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6279 insn_locations_init ();
6280 if (!DECL_IS_BUILTIN (current_function_decl))
6282 /* Eventually, all FEs should explicitly set function_start_locus. */
6283 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6284 set_curr_insn_location
6285 (DECL_SOURCE_LOCATION (current_function_decl));
6286 else
6287 set_curr_insn_location (fun->function_start_locus);
6289 else
6290 set_curr_insn_location (UNKNOWN_LOCATION);
6291 prologue_location = curr_insn_location ();
6293 #ifdef INSN_SCHEDULING
6294 init_sched_attrs ();
6295 #endif
6297 /* Make sure first insn is a note even if we don't want linenums.
6298 This makes sure the first insn will never be deleted.
6299 Also, final expects a note to appear there. */
6300 emit_note (NOTE_INSN_DELETED);
6302 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6303 discover_nonconstant_array_refs ();
6305 targetm.expand_to_rtl_hook ();
6306 crtl->init_stack_alignment ();
6307 fun->cfg->max_jumptable_ents = 0;
6309 /* Resolve the function section. Some targets, like ARM EABI rely on knowledge
6310 of the function section at expansion time to predict distance of calls. */
6311 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6313 /* Expand the variables recorded during gimple lowering. */
6314 timevar_push (TV_VAR_EXPAND);
6315 start_sequence ();
6317 var_ret_seq = expand_used_vars ();
6319 var_seq = get_insns ();
6320 end_sequence ();
6321 timevar_pop (TV_VAR_EXPAND);
6323 /* Honor stack protection warnings. */
6324 if (warn_stack_protect)
6326 if (fun->calls_alloca)
6327 warning (OPT_Wstack_protector,
6328 "stack protector not protecting local variables: "
6329 "variable length buffer");
6330 if (has_short_buffer && !crtl->stack_protect_guard)
6331 warning (OPT_Wstack_protector,
6332 "stack protector not protecting function: "
6333 "all local arrays are less than %d bytes long",
6334 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6337 /* Set up parameters and prepare for return, for the function. */
6338 expand_function_start (current_function_decl);
6340 /* If we emitted any instructions for setting up the variables,
6341 emit them before the FUNCTION_START note. */
6342 if (var_seq)
6344 emit_insn_before (var_seq, parm_birth_insn);
6346 /* In expand_function_end we'll insert the alloca save/restore
6347 before parm_birth_insn. We've just inserted an alloca call.
6348 Adjust the pointer to match. */
6349 parm_birth_insn = var_seq;
6352 /* Now propagate the RTL assignment of each partition to the
6353 underlying var of each SSA_NAME. */
6354 tree name;
6356 FOR_EACH_SSA_NAME (i, name, cfun)
6358 /* We might have generated new SSA names in
6359 update_alias_info_with_stack_vars. They will have a NULL
6360 defining statements, and won't be part of the partitioning,
6361 so ignore those. */
6362 if (!SSA_NAME_DEF_STMT (name))
6363 continue;
6365 adjust_one_expanded_partition_var (name);
6368 /* Clean up RTL of variables that straddle across multiple
6369 partitions, and check that the rtl of any PARM_DECLs that are not
6370 cleaned up is that of their default defs. */
6371 FOR_EACH_SSA_NAME (i, name, cfun)
6373 int part;
6375 /* We might have generated new SSA names in
6376 update_alias_info_with_stack_vars. They will have a NULL
6377 defining statements, and won't be part of the partitioning,
6378 so ignore those. */
6379 if (!SSA_NAME_DEF_STMT (name))
6380 continue;
6381 part = var_to_partition (SA.map, name);
6382 if (part == NO_PARTITION)
6383 continue;
6385 /* If this decl was marked as living in multiple places, reset
6386 this now to NULL. */
6387 tree var = SSA_NAME_VAR (name);
6388 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6389 SET_DECL_RTL (var, NULL);
6390 /* Check that the pseudos chosen by assign_parms are those of
6391 the corresponding default defs. */
6392 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6393 && (TREE_CODE (var) == PARM_DECL
6394 || TREE_CODE (var) == RESULT_DECL))
6396 rtx in = DECL_RTL_IF_SET (var);
6397 gcc_assert (in);
6398 rtx out = SA.partition_to_pseudo[part];
6399 gcc_assert (in == out);
6401 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6402 those expected by debug backends for each parm and for
6403 the result. This is particularly important for stabs,
6404 whose register elimination from parm's DECL_RTL may cause
6405 -fcompare-debug differences as SET_DECL_RTL changes reg's
6406 attrs. So, make sure the RTL already has the parm as the
6407 EXPR, so that it won't change. */
6408 SET_DECL_RTL (var, NULL_RTX);
6409 if (MEM_P (in))
6410 set_mem_attributes (in, var, true);
6411 SET_DECL_RTL (var, in);
6415 /* If this function is `main', emit a call to `__main'
6416 to run global initializers, etc. */
6417 if (DECL_NAME (current_function_decl)
6418 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6419 && DECL_FILE_SCOPE_P (current_function_decl))
6420 expand_main_function ();
6422 /* Initialize the stack_protect_guard field. This must happen after the
6423 call to __main (if any) so that the external decl is initialized. */
6424 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6425 stack_protect_prologue ();
6427 expand_phi_nodes (&SA);
6429 /* Release any stale SSA redirection data. */
6430 redirect_edge_var_map_empty ();
6432 /* Register rtl specific functions for cfg. */
6433 rtl_register_cfg_hooks ();
6435 init_block = construct_init_block ();
6437 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6438 remaining edges later. */
6439 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6440 e->flags &= ~EDGE_EXECUTABLE;
6442 /* If the function has too many markers, drop them while expanding. */
6443 if (cfun->debug_marker_count
6444 >= PARAM_VALUE (PARAM_MAX_DEBUG_MARKER_COUNT))
6445 cfun->debug_nonbind_markers = false;
6447 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6448 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6449 next_bb)
6450 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6452 if (MAY_HAVE_DEBUG_BIND_INSNS)
6453 expand_debug_locations ();
6455 if (deep_ter_debug_map)
6457 delete deep_ter_debug_map;
6458 deep_ter_debug_map = NULL;
6461 /* Free stuff we no longer need after GIMPLE optimizations. */
6462 free_dominance_info (CDI_DOMINATORS);
6463 free_dominance_info (CDI_POST_DOMINATORS);
6464 delete_tree_cfg_annotations (fun);
6466 timevar_push (TV_OUT_OF_SSA);
6467 finish_out_of_ssa (&SA);
6468 timevar_pop (TV_OUT_OF_SSA);
6470 timevar_push (TV_POST_EXPAND);
6471 /* We are no longer in SSA form. */
6472 fun->gimple_df->in_ssa_p = false;
6473 loops_state_clear (LOOP_CLOSED_SSA);
6475 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6476 conservatively to true until they are all profile aware. */
6477 delete lab_rtx_for_bb;
6478 free_histograms (fun);
6480 construct_exit_block ();
6481 insn_locations_finalize ();
6483 if (var_ret_seq)
6485 rtx_insn *after = return_label;
6486 rtx_insn *next = NEXT_INSN (after);
6487 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6488 after = next;
6489 emit_insn_after (var_ret_seq, after);
6492 /* Zap the tree EH table. */
6493 set_eh_throw_stmt_table (fun, NULL);
6495 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6496 split edges which edge insertions might do. */
6497 rebuild_jump_labels (get_insns ());
6499 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6500 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6502 edge e;
6503 edge_iterator ei;
6504 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6506 if (e->insns.r)
6508 rebuild_jump_labels_chain (e->insns.r);
6509 /* Put insns after parm birth, but before
6510 NOTE_INSNS_FUNCTION_BEG. */
6511 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6512 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6514 rtx_insn *insns = e->insns.r;
6515 e->insns.r = NULL;
6516 if (NOTE_P (parm_birth_insn)
6517 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6518 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6519 else
6520 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6522 else
6523 commit_one_edge_insertion (e);
6525 else
6526 ei_next (&ei);
6530 /* We're done expanding trees to RTL. */
6531 currently_expanding_to_rtl = 0;
6533 flush_mark_addressable_queue ();
6535 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6536 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6538 edge e;
6539 edge_iterator ei;
6540 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6542 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6543 e->flags &= ~EDGE_EXECUTABLE;
6545 /* At the moment not all abnormal edges match the RTL
6546 representation. It is safe to remove them here as
6547 find_many_sub_basic_blocks will rediscover them.
6548 In the future we should get this fixed properly. */
6549 if ((e->flags & EDGE_ABNORMAL)
6550 && !(e->flags & EDGE_SIBCALL))
6551 remove_edge (e);
6552 else
6553 ei_next (&ei);
6557 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6558 bitmap_ones (blocks);
6559 find_many_sub_basic_blocks (blocks);
6560 purge_all_dead_edges ();
6562 /* After initial rtl generation, call back to finish generating
6563 exception support code. We need to do this before cleaning up
6564 the CFG as the code does not expect dead landing pads. */
6565 if (fun->eh->region_tree != NULL)
6566 finish_eh_generation ();
6568 /* Call expand_stack_alignment after finishing all
6569 updates to crtl->preferred_stack_boundary. */
6570 expand_stack_alignment ();
6572 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6573 function. */
6574 if (crtl->tail_call_emit)
6575 fixup_tail_calls ();
6577 /* BB subdivision may have created basic blocks that are only reachable
6578 from unlikely bbs but not marked as such in the profile. */
6579 if (optimize)
6580 propagate_unlikely_bbs_forward ();
6582 /* Remove unreachable blocks, otherwise we cannot compute dominators
6583 which are needed for loop state verification. As a side-effect
6584 this also compacts blocks.
6585 ??? We cannot remove trivially dead insns here as for example
6586 the DRAP reg on i?86 is not magically live at this point.
6587 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6588 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6590 checking_verify_flow_info ();
6592 /* Initialize pseudos allocated for hard registers. */
6593 emit_initial_value_sets ();
6595 /* And finally unshare all RTL. */
6596 unshare_all_rtl ();
6598 /* There's no need to defer outputting this function any more; we
6599 know we want to output it. */
6600 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6602 /* Now that we're done expanding trees to RTL, we shouldn't have any
6603 more CONCATs anywhere. */
6604 generating_concat_p = 0;
6606 if (dump_file)
6608 fprintf (dump_file,
6609 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6610 /* And the pass manager will dump RTL for us. */
6613 /* If we're emitting a nested function, make sure its parent gets
6614 emitted as well. Doing otherwise confuses debug info. */
6616 tree parent;
6617 for (parent = DECL_CONTEXT (current_function_decl);
6618 parent != NULL_TREE;
6619 parent = get_containing_scope (parent))
6620 if (TREE_CODE (parent) == FUNCTION_DECL)
6621 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6624 TREE_ASM_WRITTEN (current_function_decl) = 1;
6626 /* After expanding, the return labels are no longer needed. */
6627 return_label = NULL;
6628 naked_return_label = NULL;
6630 /* After expanding, the tm_restart map is no longer needed. */
6631 if (fun->gimple_df->tm_restart)
6632 fun->gimple_df->tm_restart = NULL;
6634 /* Tag the blocks with a depth number so that change_scope can find
6635 the common parent easily. */
6636 set_block_levels (DECL_INITIAL (fun->decl), 0);
6637 default_rtl_profile ();
6639 /* For -dx discard loops now, otherwise IL verify in clean_state will
6640 ICE. */
6641 if (rtl_dump_and_exit)
6643 cfun->curr_properties &= ~PROP_loops;
6644 loop_optimizer_finalize ();
6647 timevar_pop (TV_POST_EXPAND);
6649 return 0;
6652 } // anon namespace
/* Factory function for the expand pass: allocates a new pass_expand
   object constructed with CTXT and returns it through an rtl_opt_pass
   pointer.  */
6654 rtl_opt_pass *
6655 make_pass_expand (gcc::context *ctxt)
6657 return new pass_expand (ctxt);