[multiple changes]
[official-gcc.git] / gcc / cfgexpand.c
blob9b3259d12ed198b3e8330751b25d7a87d39eaa0c
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "params.h"
65 #include "tree-inline.h"
66 #include "value-prof.h"
67 #include "tree-ssa-live.h"
68 #include "tree-outof-ssa.h"
69 #include "cfgloop.h"
70 #include "insn-attr.h" /* For INSN_SCHEDULING. */
71 #include "stringpool.h"
72 #include "attribs.h"
73 #include "asan.h"
74 #include "tree-ssa-address.h"
75 #include "output.h"
76 #include "builtins.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 enum gimple_rhs_class grhs_class;
109 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
111 if (grhs_class == GIMPLE_TERNARY_RHS)
112 t = build3 (gimple_assign_rhs_code (stmt),
113 TREE_TYPE (gimple_assign_lhs (stmt)),
114 gimple_assign_rhs1 (stmt),
115 gimple_assign_rhs2 (stmt),
116 gimple_assign_rhs3 (stmt));
117 else if (grhs_class == GIMPLE_BINARY_RHS)
118 t = build2 (gimple_assign_rhs_code (stmt),
119 TREE_TYPE (gimple_assign_lhs (stmt)),
120 gimple_assign_rhs1 (stmt),
121 gimple_assign_rhs2 (stmt));
122 else if (grhs_class == GIMPLE_UNARY_RHS)
123 t = build1 (gimple_assign_rhs_code (stmt),
124 TREE_TYPE (gimple_assign_lhs (stmt)),
125 gimple_assign_rhs1 (stmt));
126 else if (grhs_class == GIMPLE_SINGLE_RHS)
128 t = gimple_assign_rhs1 (stmt);
129 /* Avoid modifying this tree in place below. */
130 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
131 && gimple_location (stmt) != EXPR_LOCATION (t))
132 || (gimple_block (stmt)
133 && currently_expanding_to_rtl
134 && EXPR_P (t)))
135 t = copy_node (t);
137 else
138 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
/* Yield the variable underlying X: SSA_NAME_VAR (X) when X is an
   SSA_NAME, and X itself otherwise.  X is expanded more than once, so
   it must not have side effects.  */
#define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : (x))
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is not an
174 SSA name this ends in SET_DECL_RTL, otherwise make the
175 partition of T associated with X. In either case, when X is
   non-null, the MEM/REG attributes of X are first updated to name the
   leader decl chosen by leader_merge (unless X is pc_rtx). */
176 static inline void
177 set_rtl (tree t, rtx x)
/* Checking-only sanity test on the shape of X: for SSA names and
   gimple registers, X must be register-like when use_register_for_decl
   says so, and memory-like (or pc_rtx) otherwise. */
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESULT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
/* Find the expression currently recorded on X (CUR). Lowpart SUBREGs
   are looked through; for a CONCAT the first operand is used and for a
   PARALLEL the first element. pc_rtx carries no attributes, so it only
   sets SKIP. */
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
/* Choose between the recorded expression and T's underlying variable
   (or T itself when there is none); with SKIP set nothing changes. */
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
/* Only rewrite the attributes of X when the leader actually changed. */
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
/* Record X as the location of T's partition. A location recorded
   earlier must be identical; pc_rtx is never stored in the table. */
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly choose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. Entries live in the stack_vars array and
   refer to each other by index into that array. */
308 struct stack_var
310 /* The variable: a decl or an SSA name. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
314 if this variable becomes its partition's representative. */
315 poly_uint64 size;
317 /* The *byte* alignment required for this variable. Or, as with the
318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* Index of the partition representative; initially the entry's own
   index. */
322 size_t representative;
324 /* Index of the next stack variable in the partition, or EOC. */
325 size_t next;
327 /* The indices of conflicting stack variables; NULL while no conflict
   has been recorded. */
328 bitmap conflicts;
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation. */
334 static struct stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
344 is non-decreasing. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
356 /* Used during expand_used_vars. Remember if we saw a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
360 /* Compute the byte alignment to use for DECL. Ignore alignment
361 we can't do with expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
369 align = TYPE_ALIGN (TREE_TYPE (decl));
370 else
372 align = LOCAL_DECL_ALIGNMENT (decl);
373 SET_DECL_ALIGN (decl, align);
375 return align / BITS_PER_UNIT;
378 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
379 down otherwise. Return truncated BASE value. */
381 static inline unsigned HOST_WIDE_INT
382 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
384 return align_up ? (base + align - 1) & -align : base & -align;
387 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
388 Return the frame offset. */
390 static poly_int64
391 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
393 poly_int64 offset, new_frame_offset;
395 if (FRAME_GROWS_DOWNWARD)
397 new_frame_offset
398 = aligned_lower_bound (frame_offset - frame_phase - size,
399 align) + frame_phase;
400 offset = new_frame_offset;
402 else
404 new_frame_offset
405 = aligned_upper_bound (frame_offset - frame_phase,
406 align) + frame_phase;
407 offset = new_frame_offset;
408 new_frame_offset += size;
410 frame_offset = new_frame_offset;
412 if (frame_offset_overflow (frame_offset, cfun->decl))
413 frame_offset = offset = 0;
415 return offset;
418 /* Accumulate DECL into STACK_VARS. */
420 static void
421 add_stack_var (tree decl)
423 struct stack_var *v;
425 if (stack_vars_num >= stack_vars_alloc)
427 if (stack_vars_alloc)
428 stack_vars_alloc = stack_vars_alloc * 3 / 2;
429 else
430 stack_vars_alloc = 32;
431 stack_vars
432 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
434 if (!decl_to_stack_part)
435 decl_to_stack_part = new hash_map<tree, size_t>;
437 v = &stack_vars[stack_vars_num];
438 decl_to_stack_part->put (decl, stack_vars_num);
440 v->decl = decl;
441 tree size = TREE_CODE (decl) == SSA_NAME
442 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
443 : DECL_SIZE_UNIT (decl);
444 v->size = tree_to_poly_uint64 (size);
445 /* Ensure that all variables have size, so that &a != &b for any two
446 variables that are simultaneously live. */
447 if (known_eq (v->size, 0U))
448 v->size = 1;
449 v->alignb = align_local_variable (decl);
450 /* An alignment of zero can mightily confuse us later. */
451 gcc_assert (v->alignb != 0);
453 /* All variables are initially in their own partition. */
454 v->representative = stack_vars_num;
455 v->next = EOC;
457 /* All variables initially conflict with no other. */
458 v->conflicts = NULL;
460 /* Ensure that this decl doesn't get put onto the list twice. */
461 set_rtl (decl, pc_rtx);
463 stack_vars_num++;
466 /* Make the decls associated with luid's X and Y conflict. */
468 static void
469 add_stack_var_conflict (size_t x, size_t y)
471 struct stack_var *a = &stack_vars[x];
472 struct stack_var *b = &stack_vars[y];
473 if (!a->conflicts)
474 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
475 if (!b->conflicts)
476 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
477 bitmap_set_bit (a->conflicts, y);
478 bitmap_set_bit (b->conflicts, x);
481 /* Check whether the decls associated with luid's X and Y conflict. */
483 static bool
484 stack_var_conflict_p (size_t x, size_t y)
486 struct stack_var *a = &stack_vars[x];
487 struct stack_var *b = &stack_vars[y];
488 if (x == y)
489 return false;
490 /* Partitions containing an SSA name result from gimple registers
491 with things like unsupported modes. They are top-level and
492 hence conflict with everything else. */
493 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
494 return true;
496 if (!a->conflicts || !b->conflicts)
497 return false;
498 return bitmap_bit_p (a->conflicts, y);
501 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
502 enter its partition number into bitmap DATA. */
504 static bool
505 visit_op (gimple *, tree op, tree, void *data)
507 bitmap active = (bitmap)data;
508 op = get_base_address (op);
509 if (op
510 && DECL_P (op)
511 && DECL_RTL_IF_SET (op) == pc_rtx)
513 size_t *v = decl_to_stack_part->get (op);
514 if (v)
515 bitmap_set_bit (active, *v);
517 return false;
520 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
521 record conflicts between it and all currently active other partitions
522 from bitmap DATA. */
524 static bool
525 visit_conflict (gimple *, tree op, tree, void *data)
527 bitmap active = (bitmap)data;
528 op = get_base_address (op);
529 if (op
530 && DECL_P (op)
531 && DECL_RTL_IF_SET (op) == pc_rtx)
533 size_t *v = decl_to_stack_part->get (op);
534 if (v && bitmap_set_bit (active, *v))
536 size_t num = *v;
537 bitmap_iterator bi;
538 unsigned i;
539 gcc_assert (num < stack_vars_num);
540 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
541 add_stack_var_conflict (num, i);
544 return false;
547 /* Helper routine for add_scope_conflicts, calculating the active partitions
548 at the end of BB, leaving the result in WORK. We're called to generate
549 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
550 liveness. */
552 static void
553 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
555 edge e;
556 edge_iterator ei;
557 gimple_stmt_iterator gsi;
558 walk_stmt_load_store_addr_fn visit;
560 bitmap_clear (work);
561 FOR_EACH_EDGE (e, ei, bb->preds)
562 bitmap_ior_into (work, (bitmap)e->src->aux);
564 visit = visit_op;
566 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
568 gimple *stmt = gsi_stmt (gsi);
569 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
571 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
573 gimple *stmt = gsi_stmt (gsi);
575 if (gimple_clobber_p (stmt))
577 tree lhs = gimple_assign_lhs (stmt);
578 size_t *v;
579 /* Nested function lowering might introduce LHSs
580 that are COMPONENT_REFs. */
581 if (!VAR_P (lhs))
582 continue;
583 if (DECL_RTL_IF_SET (lhs) == pc_rtx
584 && (v = decl_to_stack_part->get (lhs)))
585 bitmap_clear_bit (work, *v);
587 else if (!is_gimple_debug (stmt))
589 if (for_conflict
590 && visit == visit_op)
592 /* If this is the first real instruction in this BB we need
593 to add conflicts for everything live at this point now.
594 Unlike classical liveness for named objects we can't
595 rely on seeing a def/use of the names we're interested in.
596 There might merely be indirect loads/stores. We'd not add any
597 conflicts for such partitions. */
598 bitmap_iterator bi;
599 unsigned i;
600 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
602 struct stack_var *a = &stack_vars[i];
603 if (!a->conflicts)
604 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
605 bitmap_ior_into (a->conflicts, work);
607 visit = visit_conflict;
609 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
614 /* Generate stack partition conflicts between all partitions that are
615 simultaneously live. */
617 static void
618 add_scope_conflicts (void)
620 basic_block bb;
621 bool changed;
622 bitmap work = BITMAP_ALLOC (NULL);
623 int *rpo;
624 int n_bbs;
626 /* We approximate the live range of a stack variable by taking the first
627 mention of its name as starting point(s), and by the end-of-scope
628 death clobber added by gimplify as ending point(s) of the range.
629 This overapproximates in the case we for instance moved an address-taken
630 operation upward, without also moving a dereference to it upwards.
631 But it's conservatively correct as a variable never can hold values
632 before its name is mentioned at least once.
634 We then do a mostly classical bitmap liveness algorithm. */
636 FOR_ALL_BB_FN (bb, cfun)
637 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
639 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
640 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
642 changed = true;
643 while (changed)
645 int i;
646 changed = false;
647 for (i = 0; i < n_bbs; i++)
649 bitmap active;
650 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
651 active = (bitmap)bb->aux;
652 add_scope_conflicts_1 (bb, work, false);
653 if (bitmap_ior_into (active, work))
654 changed = true;
658 FOR_EACH_BB_FN (bb, cfun)
659 add_scope_conflicts_1 (bb, work, true);
661 free (rpo);
662 BITMAP_FREE (work);
663 FOR_ALL_BB_FN (bb, cfun)
664 BITMAP_FREE (bb->aux);
667 /* A subroutine of partition_stack_vars. A comparison function for qsort,
668 sorting an array of indices by the properties of the object. */
670 static int
671 stack_var_cmp (const void *a, const void *b)
673 size_t ia = *(const size_t *)a;
674 size_t ib = *(const size_t *)b;
675 unsigned int aligna = stack_vars[ia].alignb;
676 unsigned int alignb = stack_vars[ib].alignb;
677 poly_int64 sizea = stack_vars[ia].size;
678 poly_int64 sizeb = stack_vars[ib].size;
679 tree decla = stack_vars[ia].decl;
680 tree declb = stack_vars[ib].decl;
681 bool largea, largeb;
682 unsigned int uida, uidb;
684 /* Primary compare on "large" alignment. Large comes first. */
685 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
686 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
687 if (largea != largeb)
688 return (int)largeb - (int)largea;
690 /* Secondary compare on size, decreasing */
691 int diff = compare_sizes_for_sort (sizeb, sizea);
692 if (diff != 0)
693 return diff;
695 /* Tertiary compare on true alignment, decreasing. */
696 if (aligna < alignb)
697 return -1;
698 if (aligna > alignb)
699 return 1;
701 /* Final compare on ID for sort stability, increasing.
702 Two SSA names are compared by their version, SSA names come before
703 non-SSA names, and two normal decls are compared by their DECL_UID. */
704 if (TREE_CODE (decla) == SSA_NAME)
706 if (TREE_CODE (declb) == SSA_NAME)
707 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
708 else
709 return -1;
711 else if (TREE_CODE (declb) == SSA_NAME)
712 return 1;
713 else
714 uida = DECL_UID (decla), uidb = DECL_UID (declb);
715 if (uida < uidb)
716 return 1;
717 if (uida > uidb)
718 return -1;
719 return 0;
/* Hash map from a size_t key to a bitmap.  In this file it is keyed by
   DECL_PT_UID and maps each partitioned decl to the bitmap holding the
   UIDs of all members of its partition.  */
722 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
723 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
725 /* If the points-to solution *PI points to variables that are in a partition
726 together with other variables add all partition members to the pointed-to
727 variables bitmap. */
729 static void
730 add_partitioned_vars_to_ptset (struct pt_solution *pt,
731 part_hashmap *decls_to_partitions,
732 hash_set<bitmap> *visited, bitmap temp)
734 bitmap_iterator bi;
735 unsigned i;
736 bitmap *part;
738 if (pt->anything
739 || pt->vars == NULL
740 /* The pointed-to vars bitmap is shared, it is enough to
741 visit it once. */
742 || visited->add (pt->vars))
743 return;
745 bitmap_clear (temp);
747 /* By using a temporary bitmap to store all members of the partitions
748 we have to add we make sure to visit each of the partitions only
749 once. */
750 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
751 if ((!temp
752 || !bitmap_bit_p (temp, i))
753 && (part = decls_to_partitions->get (i)))
754 bitmap_ior_into (temp, *part);
755 if (!bitmap_empty_p (temp))
756 bitmap_ior_into (pt->vars, temp);
759 /* Update points-to sets based on partition info, so we can use them on RTL.
760 The bitmaps representing stack partitions will be saved until expand,
761 where partitioned decls used as bases in memory expressions will be
762 rewritten. */
764 static void
765 update_alias_info_with_stack_vars (void)
767 part_hashmap *decls_to_partitions = NULL;
768 size_t i, j;
769 tree var = NULL_TREE;
771 for (i = 0; i < stack_vars_num; i++)
773 bitmap part = NULL;
774 tree name;
775 struct ptr_info_def *pi;
777 /* Not interested in partitions with single variable. */
778 if (stack_vars[i].representative != i
779 || stack_vars[i].next == EOC)
780 continue;
782 if (!decls_to_partitions)
784 decls_to_partitions = new part_hashmap;
785 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
788 /* Create an SSA_NAME that points to the partition for use
789 as base during alias-oracle queries on RTL for bases that
790 have been partitioned. */
791 if (var == NULL_TREE)
792 var = create_tmp_var (ptr_type_node);
793 name = make_ssa_name (var);
795 /* Create bitmaps representing partitions. They will be used for
796 points-to sets later, so use GGC alloc. */
797 part = BITMAP_GGC_ALLOC ();
798 for (j = i; j != EOC; j = stack_vars[j].next)
800 tree decl = stack_vars[j].decl;
801 unsigned int uid = DECL_PT_UID (decl);
802 bitmap_set_bit (part, uid);
803 decls_to_partitions->put (uid, part);
804 cfun->gimple_df->decls_to_pointers->put (decl, name);
805 if (TREE_ADDRESSABLE (decl))
806 TREE_ADDRESSABLE (name) = 1;
809 /* Make the SSA name point to all partition members. */
810 pi = get_ptr_info (name);
811 pt_solution_set (&pi->pt, part, false);
814 /* Make all points-to sets that contain one member of a partition
815 contain all members of the partition. */
816 if (decls_to_partitions)
818 unsigned i;
819 tree name;
820 hash_set<bitmap> visited;
821 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
823 FOR_EACH_SSA_NAME (i, name, cfun)
825 struct ptr_info_def *pi;
827 if (POINTER_TYPE_P (TREE_TYPE (name))
828 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
829 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
830 &visited, temp);
833 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
834 decls_to_partitions, &visited, temp);
836 delete decls_to_partitions;
837 BITMAP_FREE (temp);
841 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
842 partitioning algorithm. Partitions A and B are known to be non-conflicting.
843 Merge them into a single partition A. */
845 static void
846 union_stack_vars (size_t a, size_t b)
848 struct stack_var *vb = &stack_vars[b];
849 bitmap_iterator bi;
850 unsigned u;
852 gcc_assert (stack_vars[b].next == EOC);
853 /* Add B to A's partition. */
854 stack_vars[b].next = stack_vars[a].next;
855 stack_vars[b].representative = a;
856 stack_vars[a].next = b;
858 /* Update the required alignment of partition A to account for B. */
859 if (stack_vars[a].alignb < stack_vars[b].alignb)
860 stack_vars[a].alignb = stack_vars[b].alignb;
862 /* Update the interference graph and merge the conflicts. */
863 if (vb->conflicts)
865 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
866 add_stack_var_conflict (a, stack_vars[u].representative);
867 BITMAP_FREE (vb->conflicts);
871 /* A subroutine of expand_used_vars. Binpack the variables into
872 partitions constrained by the interference graph. The overall
873 algorithm used is as follows:
875 Sort the objects by size in descending order.
876 For each object A {
877 S = size(A)
878 O = 0
879 loop {
880 Look for the largest non-conflicting object B with size <= S.
881 UNION (A, B)
886 static void
887 partition_stack_vars (void)
889 size_t si, sj, n = stack_vars_num;
891 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
892 for (si = 0; si < n; ++si)
893 stack_vars_sorted[si] = si;
895 if (n == 1)
896 return;
898 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
900 for (si = 0; si < n; ++si)
902 size_t i = stack_vars_sorted[si];
903 unsigned int ialign = stack_vars[i].alignb;
904 poly_int64 isize = stack_vars[i].size;
906 /* Ignore objects that aren't partition representatives. If we
907 see a var that is not a partition representative, it must
908 have been merged earlier. */
909 if (stack_vars[i].representative != i)
910 continue;
912 for (sj = si + 1; sj < n; ++sj)
914 size_t j = stack_vars_sorted[sj];
915 unsigned int jalign = stack_vars[j].alignb;
916 poly_int64 jsize = stack_vars[j].size;
918 /* Ignore objects that aren't partition representatives. */
919 if (stack_vars[j].representative != j)
920 continue;
922 /* Do not mix objects of "small" (supported) alignment
923 and "large" (unsupported) alignment. */
924 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
925 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
926 break;
928 /* For Address Sanitizer do not mix objects with different
929 sizes, as the shorter vars wouldn't be adequately protected.
930 Don't do that for "large" (unsupported) alignment objects,
931 those aren't protected anyway. */
932 if (asan_sanitize_stack_p ()
933 && maybe_ne (isize, jsize)
934 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
935 break;
937 /* Ignore conflicting objects. */
938 if (stack_var_conflict_p (i, j))
939 continue;
941 /* UNION the objects, placing J at OFFSET. */
942 union_stack_vars (i, j);
946 update_alias_info_with_stack_vars ();
949 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
951 static void
952 dump_stack_var_partition (void)
954 size_t si, i, j, n = stack_vars_num;
956 for (si = 0; si < n; ++si)
958 i = stack_vars_sorted[si];
960 /* Skip variables that aren't partition representatives, for now. */
961 if (stack_vars[i].representative != i)
962 continue;
964 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
965 print_dec (stack_vars[i].size, dump_file);
966 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
968 for (j = i; j != EOC; j = stack_vars[j].next)
970 fputc ('\t', dump_file);
971 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
973 fputc ('\n', dump_file);
977 /* Assign rtl to DECL at BASE + OFFSET. */
979 static void
980 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
981 poly_int64 offset)
983 unsigned align;
984 rtx x;
986 /* If this fails, we've overflowed the stack frame. Error nicely? */
987 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
989 x = plus_constant (Pmode, base, offset);
990 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
991 ? TYPE_MODE (TREE_TYPE (decl))
992 : DECL_MODE (SSAVAR (decl)), x);
994 if (TREE_CODE (decl) != SSA_NAME)
996 /* Set alignment we actually gave this decl if it isn't an SSA name.
997 If it is we generate stack slots only accidentally so it isn't as
998 important, we'll simply use the alignment that is already set. */
999 if (base == virtual_stack_vars_rtx)
1000 offset -= frame_phase;
1001 align = known_alignment (offset);
1002 align *= BITS_PER_UNIT;
1003 if (align == 0 || align > base_align)
1004 align = base_align;
1006 /* One would think that we could assert that we're not decreasing
1007 alignment here, but (at least) the i386 port does exactly this
1008 via the MINIMUM_ALIGNMENT hook. */
1010 SET_DECL_ALIGN (decl, align);
1011 DECL_USER_ALIGN (decl) = 0;
1014 set_rtl (decl, x);
/* Data handed to expand_stack_vars, which records Address Sanitizer
   layout information in it. */
1017 struct stack_vars_data
1019 /* Vector of offset pairs, always end of some padding followed
1020 by start of the padding that needs Address Sanitizer protection.
1021 The vector is reversed: the highest offset pairs come first. */
1022 auto_vec<HOST_WIDE_INT> asan_vec;
1024 /* Vector of partition representative decls in between the paddings. */
1025 auto_vec<tree> asan_decl_vec;
1027 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1028 rtx asan_base;
1030 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1031 unsigned int asan_alignb;
1034 /* A subroutine of expand_used_vars. Give each partition representative
1035 a unique location within the stack frame. Update each partition member
1036 with that location. */
1038 static void
1039 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1041 size_t si, i, j, n = stack_vars_num;
1042 poly_uint64 large_size = 0, large_alloc = 0;
1043 rtx large_base = NULL;
1044 unsigned large_align = 0;
1045 bool large_allocation_done = false;
1046 tree decl;
1048 /* Determine if there are any variables requiring "large" alignment.
1049 Since these are dynamically allocated, we only process these if
1050 no predicate involved. */
1051 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1052 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1054 /* Find the total size of these variables. */
1055 for (si = 0; si < n; ++si)
1057 unsigned alignb;
1059 i = stack_vars_sorted[si];
1060 alignb = stack_vars[i].alignb;
1062 /* All "large" alignment decls come before all "small" alignment
1063 decls, but "large" alignment decls are not sorted based on
1064 their alignment. Increase large_align to track the largest
1065 required alignment. */
1066 if ((alignb * BITS_PER_UNIT) > large_align)
1067 large_align = alignb * BITS_PER_UNIT;
1069 /* Stop when we get to the first decl with "small" alignment. */
1070 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1071 break;
1073 /* Skip variables that aren't partition representatives. */
1074 if (stack_vars[i].representative != i)
1075 continue;
1077 /* Skip variables that have already had rtl assigned. See also
1078 add_stack_var where we perpetrate this pc_rtx hack. */
1079 decl = stack_vars[i].decl;
1080 if (TREE_CODE (decl) == SSA_NAME
1081 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1082 : DECL_RTL (decl) != pc_rtx)
1083 continue;
1085 large_size = aligned_upper_bound (large_size, alignb);
1086 large_size += stack_vars[i].size;
1090 for (si = 0; si < n; ++si)
1092 rtx base;
1093 unsigned base_align, alignb;
1094 poly_int64 offset;
1096 i = stack_vars_sorted[si];
1098 /* Skip variables that aren't partition representatives, for now. */
1099 if (stack_vars[i].representative != i)
1100 continue;
1102 /* Skip variables that have already had rtl assigned. See also
1103 add_stack_var where we perpetrate this pc_rtx hack. */
1104 decl = stack_vars[i].decl;
1105 if (TREE_CODE (decl) == SSA_NAME
1106 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1107 : DECL_RTL (decl) != pc_rtx)
1108 continue;
1110 /* Check the predicate to see whether this variable should be
1111 allocated in this pass. */
1112 if (pred && !pred (i))
1113 continue;
1115 alignb = stack_vars[i].alignb;
1116 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1118 base = virtual_stack_vars_rtx;
1119 /* ASAN description strings don't yet have a syntax for expressing
1120 polynomial offsets. */
1121 HOST_WIDE_INT prev_offset;
1122 if (asan_sanitize_stack_p ()
1123 && pred
1124 && frame_offset.is_constant (&prev_offset)
1125 && stack_vars[i].size.is_constant ())
1127 if (data->asan_vec.is_empty ())
1129 alloc_stack_frame_space (0, ASAN_RED_ZONE_SIZE);
1130 prev_offset = frame_offset.to_constant ();
1132 prev_offset = align_base (prev_offset,
1133 MAX (alignb, ASAN_MIN_RED_ZONE_SIZE),
1134 !FRAME_GROWS_DOWNWARD);
1135 tree repr_decl = NULL_TREE;
1136 unsigned HOST_WIDE_INT size
1137 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1138 if (data->asan_vec.is_empty ())
1139 size = MAX (size, ASAN_RED_ZONE_SIZE);
1141 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1142 ASAN_MIN_RED_ZONE_SIZE);
1143 offset = alloc_stack_frame_space (size, alignment);
1145 data->asan_vec.safe_push (prev_offset);
1146 /* Allocating a constant amount of space from a constant
1147 starting offset must give a constant result. */
1148 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1149 .to_constant ());
1150 /* Find best representative of the partition.
1151 Prefer those with DECL_NAME, even better
1152 satisfying asan_protect_stack_decl predicate. */
1153 for (j = i; j != EOC; j = stack_vars[j].next)
1154 if (asan_protect_stack_decl (stack_vars[j].decl)
1155 && DECL_NAME (stack_vars[j].decl))
1157 repr_decl = stack_vars[j].decl;
1158 break;
1160 else if (repr_decl == NULL_TREE
1161 && DECL_P (stack_vars[j].decl)
1162 && DECL_NAME (stack_vars[j].decl))
1163 repr_decl = stack_vars[j].decl;
1164 if (repr_decl == NULL_TREE)
1165 repr_decl = stack_vars[i].decl;
1166 data->asan_decl_vec.safe_push (repr_decl);
1168 /* Make sure a representative is unpoison if another
1169 variable in the partition is handled by
1170 use-after-scope sanitization. */
1171 if (asan_handled_variables != NULL
1172 && !asan_handled_variables->contains (repr_decl))
1174 for (j = i; j != EOC; j = stack_vars[j].next)
1175 if (asan_handled_variables->contains (stack_vars[j].decl))
1176 break;
1177 if (j != EOC)
1178 asan_handled_variables->add (repr_decl);
1181 data->asan_alignb = MAX (data->asan_alignb, alignb);
1182 if (data->asan_base == NULL)
1183 data->asan_base = gen_reg_rtx (Pmode);
1184 base = data->asan_base;
1186 if (!STRICT_ALIGNMENT)
1187 base_align = crtl->max_used_stack_slot_alignment;
1188 else
1189 base_align = MAX (crtl->max_used_stack_slot_alignment,
1190 GET_MODE_ALIGNMENT (SImode)
1191 << ASAN_SHADOW_SHIFT);
1193 else
1195 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1196 base_align = crtl->max_used_stack_slot_alignment;
1199 else
1201 /* Large alignment is only processed in the last pass. */
1202 if (pred)
1203 continue;
1205 /* If there were any variables requiring "large" alignment, allocate
1206 space. */
1207 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1209 poly_int64 loffset;
1210 rtx large_allocsize;
1212 large_allocsize = gen_int_mode (large_size, Pmode);
1213 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1214 loffset = alloc_stack_frame_space
1215 (rtx_to_poly_int64 (large_allocsize),
1216 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1217 large_base = get_dynamic_stack_base (loffset, large_align);
1218 large_allocation_done = true;
1220 gcc_assert (large_base != NULL);
1222 large_alloc = aligned_upper_bound (large_alloc, alignb);
1223 offset = large_alloc;
1224 large_alloc += stack_vars[i].size;
1226 base = large_base;
1227 base_align = large_align;
1230 /* Create rtl for each variable based on their location within the
1231 partition. */
1232 for (j = i; j != EOC; j = stack_vars[j].next)
1234 expand_one_stack_var_at (stack_vars[j].decl,
1235 base, base_align,
1236 offset);
1240 gcc_assert (known_eq (large_alloc, large_size));
1243 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1244 static poly_uint64
1245 account_stack_vars (void)
1247 size_t si, j, i, n = stack_vars_num;
1248 poly_uint64 size = 0;
1250 for (si = 0; si < n; ++si)
1252 i = stack_vars_sorted[si];
1254 /* Skip variables that aren't partition representatives, for now. */
1255 if (stack_vars[i].representative != i)
1256 continue;
1258 size += stack_vars[i].size;
1259 for (j = i; j != EOC; j = stack_vars[j].next)
1260 set_rtl (stack_vars[j].decl, NULL);
1262 return size;
1265 /* Record the RTL assignment X for the default def of PARM. */
1267 extern void
1268 set_parm_rtl (tree parm, rtx x)
1270 gcc_assert (TREE_CODE (parm) == PARM_DECL
1271 || TREE_CODE (parm) == RESULT_DECL);
1273 if (x && !MEM_P (x))
1275 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1276 TYPE_MODE (TREE_TYPE (parm)),
1277 TYPE_ALIGN (TREE_TYPE (parm)));
1279 /* If the variable alignment is very large we'll dynamicaly
1280 allocate it, which means that in-frame portion is just a
1281 pointer. ??? We've got a pseudo for sure here, do we
1282 actually dynamically allocate its spilling area if needed?
1283 ??? Isn't it a problem when Pmode alignment also exceeds
1284 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1285 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1286 align = GET_MODE_ALIGNMENT (Pmode);
1288 record_alignment_for_reg_var (align);
1291 tree ssa = ssa_default_def (cfun, parm);
1292 if (!ssa)
1293 return set_rtl (parm, x);
1295 int part = var_to_partition (SA.map, ssa);
1296 gcc_assert (part != NO_PARTITION);
1298 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1299 gcc_assert (changed);
1301 set_rtl (ssa, x);
1302 gcc_assert (DECL_RTL (parm) == x);
1305 /* A subroutine of expand_one_var. Called to immediately assign rtl
1306 to a variable to be allocated in the stack frame. */
1308 static void
1309 expand_one_stack_var_1 (tree var)
1311 poly_uint64 size;
1312 poly_int64 offset;
1313 unsigned byte_align;
1315 if (TREE_CODE (var) == SSA_NAME)
1317 tree type = TREE_TYPE (var);
1318 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1319 byte_align = TYPE_ALIGN_UNIT (type);
1321 else
1323 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1324 byte_align = align_local_variable (var);
1327 /* We handle highly aligned variables in expand_stack_vars. */
1328 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1330 offset = alloc_stack_frame_space (size, byte_align);
1332 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1333 crtl->max_used_stack_slot_alignment, offset);
1336 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1337 already assigned some MEM. */
1339 static void
1340 expand_one_stack_var (tree var)
1342 if (TREE_CODE (var) == SSA_NAME)
1344 int part = var_to_partition (SA.map, var);
1345 if (part != NO_PARTITION)
1347 rtx x = SA.partition_to_pseudo[part];
1348 gcc_assert (x);
1349 gcc_assert (MEM_P (x));
1350 return;
1354 return expand_one_stack_var_1 (var);
1357 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1358 that will reside in a hard register. */
1360 static void
1361 expand_one_hard_reg_var (tree var)
1363 rest_of_decl_compilation (var, 0, 0);
1366 /* Record the alignment requirements of some variable assigned to a
1367 pseudo. */
1369 static void
1370 record_alignment_for_reg_var (unsigned int align)
1372 if (SUPPORTS_STACK_ALIGNMENT
1373 && crtl->stack_alignment_estimated < align)
1375 /* stack_alignment_estimated shouldn't change after stack
1376 realign decision made */
1377 gcc_assert (!crtl->stack_realign_processed);
1378 crtl->stack_alignment_estimated = align;
1381 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1382 So here we only make sure stack_alignment_needed >= align. */
1383 if (crtl->stack_alignment_needed < align)
1384 crtl->stack_alignment_needed = align;
1385 if (crtl->max_used_stack_slot_alignment < align)
1386 crtl->max_used_stack_slot_alignment = align;
1389 /* Create RTL for an SSA partition. */
1391 static void
1392 expand_one_ssa_partition (tree var)
1394 int part = var_to_partition (SA.map, var);
1395 gcc_assert (part != NO_PARTITION);
1397 if (SA.partition_to_pseudo[part])
1398 return;
1400 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1401 TYPE_MODE (TREE_TYPE (var)),
1402 TYPE_ALIGN (TREE_TYPE (var)));
1404 /* If the variable alignment is very large we'll dynamicaly allocate
1405 it, which means that in-frame portion is just a pointer. */
1406 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1407 align = GET_MODE_ALIGNMENT (Pmode);
1409 record_alignment_for_reg_var (align);
1411 if (!use_register_for_decl (var))
1413 if (defer_stack_allocation (var, true))
1414 add_stack_var (var);
1415 else
1416 expand_one_stack_var_1 (var);
1417 return;
1420 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1421 rtx x = gen_reg_rtx (reg_mode);
1423 set_rtl (var, x);
1425 /* For a promoted variable, X will not be used directly but wrapped in a
1426 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1427 will assume that its upper bits can be inferred from its lower bits.
1428 Therefore, if X isn't initialized on every path from the entry, then
1429 we must do it manually in order to fulfill the above assumption. */
1430 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1431 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1432 emit_move_insn (x, CONST0_RTX (reg_mode));
1435 /* Record the association between the RTL generated for partition PART
1436 and the underlying variable of the SSA_NAME VAR. */
1438 static void
1439 adjust_one_expanded_partition_var (tree var)
1441 if (!var)
1442 return;
1444 tree decl = SSA_NAME_VAR (var);
1446 int part = var_to_partition (SA.map, var);
1447 if (part == NO_PARTITION)
1448 return;
1450 rtx x = SA.partition_to_pseudo[part];
1452 gcc_assert (x);
1454 set_rtl (var, x);
1456 if (!REG_P (x))
1457 return;
1459 /* Note if the object is a user variable. */
1460 if (decl && !DECL_ARTIFICIAL (decl))
1461 mark_user_reg (x);
1463 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1464 mark_reg_pointer (x, get_pointer_alignment (var));
1467 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1468 that will reside in a pseudo register. */
1470 static void
1471 expand_one_register_var (tree var)
1473 if (TREE_CODE (var) == SSA_NAME)
1475 int part = var_to_partition (SA.map, var);
1476 if (part != NO_PARTITION)
1478 rtx x = SA.partition_to_pseudo[part];
1479 gcc_assert (x);
1480 gcc_assert (REG_P (x));
1481 return;
1483 gcc_unreachable ();
1486 tree decl = var;
1487 tree type = TREE_TYPE (decl);
1488 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1489 rtx x = gen_reg_rtx (reg_mode);
1491 set_rtl (var, x);
1493 /* Note if the object is a user variable. */
1494 if (!DECL_ARTIFICIAL (decl))
1495 mark_user_reg (x);
1497 if (POINTER_TYPE_P (type))
1498 mark_reg_pointer (x, get_pointer_alignment (var));
1501 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1502 has some associated error, e.g. its type is error-mark. We just need
1503 to pick something that won't crash the rest of the compiler. */
1505 static void
1506 expand_one_error_var (tree var)
1508 machine_mode mode = DECL_MODE (var);
1509 rtx x;
1511 if (mode == BLKmode)
1512 x = gen_rtx_MEM (BLKmode, const0_rtx);
1513 else if (mode == VOIDmode)
1514 x = const0_rtx;
1515 else
1516 x = gen_reg_rtx (mode);
1518 SET_DECL_RTL (var, x);
1521 /* A subroutine of expand_one_var. VAR is a variable that will be
1522 allocated to the local stack frame. Return true if we wish to
1523 add VAR to STACK_VARS so that it will be coalesced with other
1524 variables. Return false to allocate VAR immediately.
1526 This function is used to reduce the number of variables considered
1527 for coalescing, which reduces the size of the quadratic problem. */
1529 static bool
1530 defer_stack_allocation (tree var, bool toplevel)
1532 tree size_unit = TREE_CODE (var) == SSA_NAME
1533 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1534 : DECL_SIZE_UNIT (var);
1535 poly_uint64 size;
1537 /* Whether the variable is small enough for immediate allocation not to be
1538 a problem with regard to the frame size. */
1539 bool smallish
1540 = (poly_int_tree_p (size_unit, &size)
1541 && (estimated_poly_value (size)
1542 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING)));
1544 /* If stack protection is enabled, *all* stack variables must be deferred,
1545 so that we can re-order the strings to the top of the frame.
1546 Similarly for Address Sanitizer. */
1547 if (flag_stack_protect || asan_sanitize_stack_p ())
1548 return true;
1550 unsigned int align = TREE_CODE (var) == SSA_NAME
1551 ? TYPE_ALIGN (TREE_TYPE (var))
1552 : DECL_ALIGN (var);
1554 /* We handle "large" alignment via dynamic allocation. We want to handle
1555 this extra complication in only one place, so defer them. */
1556 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1557 return true;
1559 bool ignored = TREE_CODE (var) == SSA_NAME
1560 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1561 : DECL_IGNORED_P (var);
1563 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1564 might be detached from their block and appear at toplevel when we reach
1565 here. We want to coalesce them with variables from other blocks when
1566 the immediate contribution to the frame size would be noticeable. */
1567 if (toplevel && optimize > 0 && ignored && !smallish)
1568 return true;
1570 /* Variables declared in the outermost scope automatically conflict
1571 with every other variable. The only reason to want to defer them
1572 at all is that, after sorting, we can more efficiently pack
1573 small variables in the stack frame. Continue to defer at -O2. */
1574 if (toplevel && optimize < 2)
1575 return false;
1577 /* Without optimization, *most* variables are allocated from the
1578 stack, which makes the quadratic problem large exactly when we
1579 want compilation to proceed as quickly as possible. On the
1580 other hand, we don't want the function's stack frame size to
1581 get completely out of hand. So we avoid adding scalars and
1582 "small" aggregates to the list at all. */
1583 if (optimize == 0 && smallish)
1584 return false;
1586 return true;
1589 /* A subroutine of expand_used_vars. Expand one variable according to
1590 its flavor. Variables to be placed on the stack are not actually
1591 expanded yet, merely recorded.
1592 When REALLY_EXPAND is false, only add stack values to be allocated.
1593 Return stack usage this variable is supposed to take.
1596 static poly_uint64
1597 expand_one_var (tree var, bool toplevel, bool really_expand)
1599 unsigned int align = BITS_PER_UNIT;
1600 tree origvar = var;
1602 var = SSAVAR (var);
1604 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1606 if (is_global_var (var))
1607 return 0;
1609 /* Because we don't know if VAR will be in register or on stack,
1610 we conservatively assume it will be on stack even if VAR is
1611 eventually put into register after RA pass. For non-automatic
1612 variables, which won't be on stack, we collect alignment of
1613 type and ignore user specified alignment. Similarly for
1614 SSA_NAMEs for which use_register_for_decl returns true. */
1615 if (TREE_STATIC (var)
1616 || DECL_EXTERNAL (var)
1617 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1618 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1619 TYPE_MODE (TREE_TYPE (var)),
1620 TYPE_ALIGN (TREE_TYPE (var)));
1621 else if (DECL_HAS_VALUE_EXPR_P (var)
1622 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1623 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1624 or variables which were assigned a stack slot already by
1625 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1626 changed from the offset chosen to it. */
1627 align = crtl->stack_alignment_estimated;
1628 else
1629 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1631 /* If the variable alignment is very large we'll dynamicaly allocate
1632 it, which means that in-frame portion is just a pointer. */
1633 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1634 align = GET_MODE_ALIGNMENT (Pmode);
1637 record_alignment_for_reg_var (align);
1639 poly_uint64 size;
1640 if (TREE_CODE (origvar) == SSA_NAME)
1642 gcc_assert (!VAR_P (var)
1643 || (!DECL_EXTERNAL (var)
1644 && !DECL_HAS_VALUE_EXPR_P (var)
1645 && !TREE_STATIC (var)
1646 && TREE_TYPE (var) != error_mark_node
1647 && !DECL_HARD_REGISTER (var)
1648 && really_expand));
1650 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1652 else if (DECL_EXTERNAL (var))
1654 else if (DECL_HAS_VALUE_EXPR_P (var))
1656 else if (TREE_STATIC (var))
1658 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1660 else if (TREE_TYPE (var) == error_mark_node)
1662 if (really_expand)
1663 expand_one_error_var (var);
1665 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1667 if (really_expand)
1669 expand_one_hard_reg_var (var);
1670 if (!DECL_HARD_REGISTER (var))
1671 /* Invalid register specification. */
1672 expand_one_error_var (var);
1675 else if (use_register_for_decl (var))
1677 if (really_expand)
1678 expand_one_register_var (origvar);
1680 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1681 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1683 /* Reject variables which cover more than half of the address-space. */
1684 if (really_expand)
1686 if (DECL_NONLOCAL_FRAME (var))
1687 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1688 "total size of local objects is too large");
1689 else
1690 error_at (DECL_SOURCE_LOCATION (var),
1691 "size of variable %q+D is too large", var);
1692 expand_one_error_var (var);
1695 else if (defer_stack_allocation (var, toplevel))
1696 add_stack_var (origvar);
1697 else
1699 if (really_expand)
1701 if (lookup_attribute ("naked",
1702 DECL_ATTRIBUTES (current_function_decl)))
1703 error ("cannot allocate stack for variable %q+D, naked function.",
1704 var);
1706 expand_one_stack_var (origvar);
1708 return size;
1710 return 0;
1713 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1714 expanding variables. Those variables that can be put into registers
1715 are allocated pseudos; those that can't are put on the stack.
1717 TOPLEVEL is true if this is the outermost BLOCK. */
1719 static void
1720 expand_used_vars_for_block (tree block, bool toplevel)
1722 tree t;
1724 /* Expand all variables at this level. */
1725 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1726 if (TREE_USED (t)
1727 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1728 || !DECL_NONSHAREABLE (t)))
1729 expand_one_var (t, toplevel, true);
1731 /* Expand all variables at containing levels. */
1732 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1733 expand_used_vars_for_block (t, false);
1736 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1737 and clear TREE_USED on all local variables. */
1739 static void
1740 clear_tree_used (tree block)
1742 tree t;
1744 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1745 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1746 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1747 || !DECL_NONSHAREABLE (t))
1748 TREE_USED (t) = 0;
1750 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1751 clear_tree_used (t);
/* Values that flag_stack_protect is compared against in this file.  */
enum {
  SPCT_FLAG_DEFAULT = 1,
  SPCT_FLAG_ALL = 2,
  SPCT_FLAG_STRONG = 3,
  SPCT_FLAG_EXPLICIT = 4
};
1761 /* Examine TYPE and determine a bit mask of the following features. */
1763 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1764 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1765 #define SPCT_HAS_ARRAY 4
1766 #define SPCT_HAS_AGGREGATE 8
1768 static unsigned int
1769 stack_protect_classify_type (tree type)
1771 unsigned int ret = 0;
1772 tree t;
1774 switch (TREE_CODE (type))
1776 case ARRAY_TYPE:
1777 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1778 if (t == char_type_node
1779 || t == signed_char_type_node
1780 || t == unsigned_char_type_node)
1782 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1783 unsigned HOST_WIDE_INT len;
1785 if (!TYPE_SIZE_UNIT (type)
1786 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1787 len = max;
1788 else
1789 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1791 if (len < max)
1792 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1793 else
1794 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1796 else
1797 ret = SPCT_HAS_ARRAY;
1798 break;
1800 case UNION_TYPE:
1801 case QUAL_UNION_TYPE:
1802 case RECORD_TYPE:
1803 ret = SPCT_HAS_AGGREGATE;
1804 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1805 if (TREE_CODE (t) == FIELD_DECL)
1806 ret |= stack_protect_classify_type (TREE_TYPE (t));
1807 break;
1809 default:
1810 break;
1813 return ret;
1816 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1817 part of the local stack frame. Remember if we ever return nonzero for
1818 any variable in this function. The return value is the phase number in
1819 which the variable should be allocated. */
1821 static int
1822 stack_protect_decl_phase (tree decl)
1824 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1825 int ret = 0;
1827 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1828 has_short_buffer = true;
1830 if (flag_stack_protect == SPCT_FLAG_ALL
1831 || flag_stack_protect == SPCT_FLAG_STRONG
1832 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1833 && lookup_attribute ("stack_protect",
1834 DECL_ATTRIBUTES (current_function_decl))))
1836 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1837 && !(bits & SPCT_HAS_AGGREGATE))
1838 ret = 1;
1839 else if (bits & SPCT_HAS_ARRAY)
1840 ret = 2;
1842 else
1843 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1845 if (ret)
1846 has_protected_decls = true;
1848 return ret;
1851 /* Two helper routines that check for phase 1 and phase 2. These are used
1852 as callbacks for expand_stack_vars. */
1854 static bool
1855 stack_protect_decl_phase_1 (size_t i)
1857 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1860 static bool
1861 stack_protect_decl_phase_2 (size_t i)
1863 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1866 /* And helper function that checks for asan phase (with stack protector
1867 it is phase 3). This is used as callback for expand_stack_vars.
1868 Returns true if any of the vars in the partition need to be protected. */
1870 static bool
1871 asan_decl_phase_3 (size_t i)
1873 while (i != EOC)
1875 if (asan_protect_stack_decl (stack_vars[i].decl))
1876 return true;
1877 i = stack_vars[i].next;
1879 return false;
1882 /* Ensure that variables in different stack protection phases conflict
1883 so that they are not merged and share the same stack slot. */
1885 static void
1886 add_stack_protection_conflicts (void)
1888 size_t i, j, n = stack_vars_num;
1889 unsigned char *phase;
1891 phase = XNEWVEC (unsigned char, n);
1892 for (i = 0; i < n; ++i)
1893 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1895 for (i = 0; i < n; ++i)
1897 unsigned char ph_i = phase[i];
1898 for (j = i + 1; j < n; ++j)
1899 if (ph_i != phase[j])
1900 add_stack_var_conflict (i, j);
1903 XDELETEVEC (phase);
1906 /* Create a decl for the guard at the top of the stack frame. */
1908 static void
1909 create_stack_guard (void)
1911 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1912 VAR_DECL, NULL, ptr_type_node);
1913 TREE_THIS_VOLATILE (guard) = 1;
1914 TREE_USED (guard) = 1;
1915 expand_one_stack_var (guard);
1916 crtl->stack_protect_guard = guard;
1919 /* Prepare for expanding variables. */
1920 static void
1921 init_vars_expansion (void)
1923 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1924 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1926 /* A map from decl to stack partition. */
1927 decl_to_stack_part = new hash_map<tree, size_t>;
1929 /* Initialize local stack smashing state. */
1930 has_protected_decls = false;
1931 has_short_buffer = false;
1934 /* Free up stack variable graph data. */
1935 static void
1936 fini_vars_expansion (void)
1938 bitmap_obstack_release (&stack_var_bitmap_obstack);
1939 if (stack_vars)
1940 XDELETEVEC (stack_vars);
1941 if (stack_vars_sorted)
1942 XDELETEVEC (stack_vars_sorted);
1943 stack_vars = NULL;
1944 stack_vars_sorted = NULL;
1945 stack_vars_alloc = stack_vars_num = 0;
1946 delete decl_to_stack_part;
1947 decl_to_stack_part = NULL;
1950 /* Make a fair guess for the size of the stack frame of the function
1951 in NODE. This doesn't have to be exact, the result is only used in
1952 the inline heuristics. So we don't want to run the full stack var
1953 packing algorithm (which is quadratic in the number of stack vars).
1954 Instead, we calculate the total size of all stack vars. This turns
1955 out to be a pretty fair estimate -- packing of stack vars doesn't
1956 happen very often. */
1958 HOST_WIDE_INT
1959 estimated_stack_frame_size (struct cgraph_node *node)
1961 poly_int64 size = 0;
1962 size_t i;
1963 tree var;
1964 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1966 push_cfun (fn);
1968 init_vars_expansion ();
1970 FOR_EACH_LOCAL_DECL (fn, i, var)
1971 if (auto_var_in_fn_p (var, fn->decl))
1972 size += expand_one_var (var, true, false);
1974 if (stack_vars_num > 0)
1976 /* Fake sorting the stack vars for account_stack_vars (). */
1977 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1978 for (i = 0; i < stack_vars_num; ++i)
1979 stack_vars_sorted[i] = i;
1980 size += account_stack_vars ();
1983 fini_vars_expansion ();
1984 pop_cfun ();
1985 return estimated_poly_value (size);
1988 /* Helper routine to check if a record or union contains an array field. */
1990 static int
1991 record_or_union_type_has_array_p (const_tree tree_type)
1993 tree fields = TYPE_FIELDS (tree_type);
1994 tree f;
1996 for (f = fields; f; f = DECL_CHAIN (f))
1997 if (TREE_CODE (f) == FIELD_DECL)
1999 tree field_type = TREE_TYPE (f);
2000 if (RECORD_OR_UNION_TYPE_P (field_type)
2001 && record_or_union_type_has_array_p (field_type))
2002 return 1;
2003 if (TREE_CODE (field_type) == ARRAY_TYPE)
2004 return 1;
2006 return 0;
2009 /* Check if the current function has local referenced variables that
2010 have their addresses taken, contain an array, or are arrays. */
2012 static bool
2013 stack_protect_decl_p ()
2015 unsigned i;
2016 tree var;
2018 FOR_EACH_LOCAL_DECL (cfun, i, var)
2019 if (!is_global_var (var))
2021 tree var_type = TREE_TYPE (var);
2022 if (VAR_P (var)
2023 && (TREE_CODE (var_type) == ARRAY_TYPE
2024 || TREE_ADDRESSABLE (var)
2025 || (RECORD_OR_UNION_TYPE_P (var_type)
2026 && record_or_union_type_has_array_p (var_type))))
2027 return true;
2029 return false;
2032 /* Check if the current function has calls that use a return slot. */
2034 static bool
2035 stack_protect_return_slot_p ()
2037 basic_block bb;
2039 FOR_ALL_BB_FN (bb, cfun)
2040 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2041 !gsi_end_p (gsi); gsi_next (&gsi))
2043 gimple *stmt = gsi_stmt (gsi);
2044 /* This assumes that calls to internal-only functions never
2045 use a return slot. */
2046 if (is_gimple_call (stmt)
2047 && !gimple_call_internal_p (stmt)
2048 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2049 gimple_call_fndecl (stmt)))
2050 return true;
2052 return false;
2055 /* Expand all variables used in the function. */
2057 static rtx_insn *
2058 expand_used_vars (void)
2060 tree var, outer_block = DECL_INITIAL (current_function_decl);
2061 auto_vec<tree> maybe_local_decls;
2062 rtx_insn *var_end_seq = NULL;
2063 unsigned i;
2064 unsigned len;
2065 bool gen_stack_protect_signal = false;
2067 /* Compute the phase of the stack frame for this function. */
2069 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2070 int off = targetm.starting_frame_offset () % align;
2071 frame_phase = off ? align - off : 0;
2074 /* Set TREE_USED on all variables in the local_decls. */
2075 FOR_EACH_LOCAL_DECL (cfun, i, var)
2076 TREE_USED (var) = 1;
2077 /* Clear TREE_USED on all variables associated with a block scope. */
2078 clear_tree_used (DECL_INITIAL (current_function_decl));
2080 init_vars_expansion ();
2082 if (targetm.use_pseudo_pic_reg ())
2083 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2085 for (i = 0; i < SA.map->num_partitions; i++)
2087 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2088 continue;
2090 tree var = partition_to_var (SA.map, i);
2092 gcc_assert (!virtual_operand_p (var));
2094 expand_one_ssa_partition (var);
2097 if (flag_stack_protect == SPCT_FLAG_STRONG)
2098 gen_stack_protect_signal
2099 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2101 /* At this point all variables on the local_decls with TREE_USED
2102 set are not associated with any block scope. Lay them out. */
2104 len = vec_safe_length (cfun->local_decls);
2105 FOR_EACH_LOCAL_DECL (cfun, i, var)
2107 bool expand_now = false;
2109 /* Expanded above already. */
2110 if (is_gimple_reg (var))
2112 TREE_USED (var) = 0;
2113 goto next;
2115 /* We didn't set a block for static or extern because it's hard
2116 to tell the difference between a global variable (re)declared
2117 in a local scope, and one that's really declared there to
2118 begin with. And it doesn't really matter much, since we're
2119 not giving them stack space. Expand them now. */
2120 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2121 expand_now = true;
2123 /* Expand variables not associated with any block now. Those created by
2124 the optimizers could be live anywhere in the function. Those that
2125 could possibly have been scoped originally and detached from their
2126 block will have their allocation deferred so we coalesce them with
2127 others when optimization is enabled. */
2128 else if (TREE_USED (var))
2129 expand_now = true;
2131 /* Finally, mark all variables on the list as used. We'll use
2132 this in a moment when we expand those associated with scopes. */
2133 TREE_USED (var) = 1;
2135 if (expand_now)
2136 expand_one_var (var, true, true);
2138 next:
2139 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2141 rtx rtl = DECL_RTL_IF_SET (var);
2143 /* Keep artificial non-ignored vars in cfun->local_decls
2144 chain until instantiate_decls. */
2145 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2146 add_local_decl (cfun, var);
2147 else if (rtl == NULL_RTX)
2148 /* If rtl isn't set yet, which can happen e.g. with
2149 -fstack-protector, retry before returning from this
2150 function. */
2151 maybe_local_decls.safe_push (var);
2155 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2157 +-----------------+-----------------+
2158 | ...processed... | ...duplicates...|
2159 +-----------------+-----------------+
2161 +-- LEN points here.
2163 We just want the duplicates, as those are the artificial
2164 non-ignored vars that we want to keep until instantiate_decls.
2165 Move them down and truncate the array. */
2166 if (!vec_safe_is_empty (cfun->local_decls))
2167 cfun->local_decls->block_remove (0, len);
2169 /* At this point, all variables within the block tree with TREE_USED
2170 set are actually used by the optimized function. Lay them out. */
2171 expand_used_vars_for_block (outer_block, true);
2173 if (stack_vars_num > 0)
2175 add_scope_conflicts ();
2177 /* If stack protection is enabled, we don't share space between
2178 vulnerable data and non-vulnerable data. */
2179 if (flag_stack_protect != 0
2180 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2181 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2182 && lookup_attribute ("stack_protect",
2183 DECL_ATTRIBUTES (current_function_decl)))))
2184 add_stack_protection_conflicts ();
2186 /* Now that we have collected all stack variables, and have computed a
2187 minimal interference graph, attempt to save some stack space. */
2188 partition_stack_vars ();
2189 if (dump_file)
2190 dump_stack_var_partition ();
2193 switch (flag_stack_protect)
2195 case SPCT_FLAG_ALL:
2196 create_stack_guard ();
2197 break;
2199 case SPCT_FLAG_STRONG:
2200 if (gen_stack_protect_signal
2201 || cfun->calls_alloca || has_protected_decls
2202 || lookup_attribute ("stack_protect",
2203 DECL_ATTRIBUTES (current_function_decl)))
2204 create_stack_guard ();
2205 break;
2207 case SPCT_FLAG_DEFAULT:
2208 if (cfun->calls_alloca || has_protected_decls
2209 || lookup_attribute ("stack_protect",
2210 DECL_ATTRIBUTES (current_function_decl)))
2211 create_stack_guard ();
2212 break;
2214 case SPCT_FLAG_EXPLICIT:
2215 if (lookup_attribute ("stack_protect",
2216 DECL_ATTRIBUTES (current_function_decl)))
2217 create_stack_guard ();
2218 break;
2219 default:
2223 /* Assign rtl to each variable based on these partitions. */
2224 if (stack_vars_num > 0)
2226 struct stack_vars_data data;
2228 data.asan_base = NULL_RTX;
2229 data.asan_alignb = 0;
2231 /* Reorder decls to be protected by iterating over the variables
2232 array multiple times, and allocating out of each phase in turn. */
2233 /* ??? We could probably integrate this into the qsort we did
2234 earlier, such that we naturally see these variables first,
2235 and thus naturally allocate things in the right order. */
2236 if (has_protected_decls)
2238 /* Phase 1 contains only character arrays. */
2239 expand_stack_vars (stack_protect_decl_phase_1, &data);
2241 /* Phase 2 contains other kinds of arrays. */
2242 if (flag_stack_protect == SPCT_FLAG_ALL
2243 || flag_stack_protect == SPCT_FLAG_STRONG
2244 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2245 && lookup_attribute ("stack_protect",
2246 DECL_ATTRIBUTES (current_function_decl))))
2247 expand_stack_vars (stack_protect_decl_phase_2, &data);
2250 if (asan_sanitize_stack_p ())
2251 /* Phase 3, any partitions that need asan protection
2252 in addition to phase 1 and 2. */
2253 expand_stack_vars (asan_decl_phase_3, &data);
2255 /* ASAN description strings don't yet have a syntax for expressing
2256 polynomial offsets. */
2257 HOST_WIDE_INT prev_offset;
2258 if (!data.asan_vec.is_empty ()
2259 && frame_offset.is_constant (&prev_offset))
2261 HOST_WIDE_INT offset, sz, redzonesz;
2262 redzonesz = ASAN_RED_ZONE_SIZE;
2263 sz = data.asan_vec[0] - prev_offset;
2264 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2265 && data.asan_alignb <= 4096
2266 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2267 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2268 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2269 /* Allocating a constant amount of space from a constant
2270 starting offset must give a constant result. */
2271 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2272 .to_constant ());
2273 data.asan_vec.safe_push (prev_offset);
2274 data.asan_vec.safe_push (offset);
2275 /* Leave space for alignment if STRICT_ALIGNMENT. */
2276 if (STRICT_ALIGNMENT)
2277 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2278 << ASAN_SHADOW_SHIFT)
2279 / BITS_PER_UNIT, 1);
2281 var_end_seq
2282 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2283 data.asan_base,
2284 data.asan_alignb,
2285 data.asan_vec.address (),
2286 data.asan_decl_vec.address (),
2287 data.asan_vec.length ());
2290 expand_stack_vars (NULL, &data);
2293 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2294 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2295 virtual_stack_vars_rtx,
2296 var_end_seq);
2298 fini_vars_expansion ();
2300 /* If there were any artificial non-ignored vars without rtl
2301 found earlier, see if deferred stack allocation hasn't assigned
2302 rtl to them. */
2303 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2305 rtx rtl = DECL_RTL_IF_SET (var);
2307 /* Keep artificial non-ignored vars in cfun->local_decls
2308 chain until instantiate_decls. */
2309 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2310 add_local_decl (cfun, var);
2313 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2314 if (STACK_ALIGNMENT_NEEDED)
2316 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2317 if (FRAME_GROWS_DOWNWARD)
2318 frame_offset = aligned_lower_bound (frame_offset, align);
2319 else
2320 frame_offset = aligned_upper_bound (frame_offset, align);
2323 return var_end_seq;
2327 /* If we need to produce a detailed dump, print the tree representation
2328 for STMT to the dump file. SINCE is the last RTX after which the RTL
2329 generated for STMT should have been appended. */
2331 static void
2332 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2334 if (dump_file && (dump_flags & TDF_DETAILS))
2336 fprintf (dump_file, "\n;; ");
2337 print_gimple_stmt (dump_file, stmt, 0,
2338 TDF_SLIM | (dump_flags & TDF_LINENO));
2339 fprintf (dump_file, "\n");
2341 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2345 /* Maps the blocks that do not contain tree labels to rtx labels. */
2347 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2349 /* Returns the label_rtx expression for a label starting basic block BB. */
2351 static rtx_code_label *
2352 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2354 gimple_stmt_iterator gsi;
2355 tree lab;
2357 if (bb->flags & BB_RTL)
2358 return block_label (bb);
2360 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2361 if (elt)
2362 return *elt;
2364 /* Find the tree label if it is present. */
2366 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2368 glabel *lab_stmt;
2370 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2371 if (!lab_stmt)
2372 break;
2374 lab = gimple_label_label (lab_stmt);
2375 if (DECL_NONLOCAL (lab))
2376 break;
2378 return jump_target_rtx (lab);
2381 rtx_code_label *l = gen_label_rtx ();
2382 lab_rtx_for_bb->put (bb, l);
2383 return l;
2387 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2388 of a basic block where we just expanded the conditional at the end,
2389 possibly clean up the CFG and instruction sequence. LAST is the
2390 last instruction before the just emitted jump sequence. */
2392 static void
2393 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2395 /* Special case: when jumpif decides that the condition is
2396 trivial it emits an unconditional jump (and the necessary
2397 barrier). But we still have two edges, the fallthru one is
2398 wrong. purge_dead_edges would clean this up later. Unfortunately
2399 we have to insert insns (and split edges) before
2400 find_many_sub_basic_blocks and hence before purge_dead_edges.
2401 But splitting edges might create new blocks which depend on the
2402 fact that if there are two edges there's no barrier. So the
2403 barrier would get lost and verify_flow_info would ICE. Instead
2404 of auditing all edge splitters to care for the barrier (which
2405 normally isn't there in a cleaned CFG), fix it here. */
2406 if (BARRIER_P (get_last_insn ()))
2408 rtx_insn *insn;
2409 remove_edge (e);
2410 /* Now, we have a single successor block, if we have insns to
2411 insert on the remaining edge we potentially will insert
2412 it at the end of this block (if the dest block isn't feasible)
2413 in order to avoid splitting the edge. This insertion will take
2414 place in front of the last jump. But we might have emitted
2415 multiple jumps (conditional and one unconditional) to the
2416 same destination. Inserting in front of the last one then
2417 is a problem. See PR 40021. We fix this by deleting all
2418 jumps except the last unconditional one. */
2419 insn = PREV_INSN (get_last_insn ());
2420 /* Make sure we have an unconditional jump. Otherwise we're
2421 confused. */
2422 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2423 for (insn = PREV_INSN (insn); insn != last;)
2425 insn = PREV_INSN (insn);
2426 if (JUMP_P (NEXT_INSN (insn)))
2428 if (!any_condjump_p (NEXT_INSN (insn)))
2430 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2431 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2433 delete_insn (NEXT_INSN (insn));
2439 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2440 Returns a new basic block if we've terminated the current basic
2441 block and created a new one. */
2443 static basic_block
2444 expand_gimple_cond (basic_block bb, gcond *stmt)
2446 basic_block new_bb, dest;
2447 edge true_edge;
2448 edge false_edge;
2449 rtx_insn *last2, *last;
2450 enum tree_code code;
2451 tree op0, op1;
2453 code = gimple_cond_code (stmt);
2454 op0 = gimple_cond_lhs (stmt);
2455 op1 = gimple_cond_rhs (stmt);
2456 /* We're sometimes presented with such code:
2457 D.123_1 = x < y;
2458 if (D.123_1 != 0)
2460 This would expand to two comparisons which then later might
2461 be cleaned up by combine. But some pattern matchers like if-conversion
2462 work better when there's only one compare, so make up for this
2463 here as special exception if TER would have made the same change. */
2464 if (SA.values
2465 && TREE_CODE (op0) == SSA_NAME
2466 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2467 && TREE_CODE (op1) == INTEGER_CST
2468 && ((gimple_cond_code (stmt) == NE_EXPR
2469 && integer_zerop (op1))
2470 || (gimple_cond_code (stmt) == EQ_EXPR
2471 && integer_onep (op1)))
2472 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2474 gimple *second = SSA_NAME_DEF_STMT (op0);
2475 if (gimple_code (second) == GIMPLE_ASSIGN)
2477 enum tree_code code2 = gimple_assign_rhs_code (second);
2478 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2480 code = code2;
2481 op0 = gimple_assign_rhs1 (second);
2482 op1 = gimple_assign_rhs2 (second);
2484 /* If jumps are cheap and the target does not support conditional
2485 compare, turn some more codes into jumpy sequences. */
2486 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2487 && targetm.gen_ccmp_first == NULL)
2489 if ((code2 == BIT_AND_EXPR
2490 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2491 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2492 || code2 == TRUTH_AND_EXPR)
2494 code = TRUTH_ANDIF_EXPR;
2495 op0 = gimple_assign_rhs1 (second);
2496 op1 = gimple_assign_rhs2 (second);
2498 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2500 code = TRUTH_ORIF_EXPR;
2501 op0 = gimple_assign_rhs1 (second);
2502 op1 = gimple_assign_rhs2 (second);
2508 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2509 into (x - C2) * C3 < C4. */
2510 if ((code == EQ_EXPR || code == NE_EXPR)
2511 && TREE_CODE (op0) == SSA_NAME
2512 && TREE_CODE (op1) == INTEGER_CST)
2513 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2515 last2 = last = get_last_insn ();
2517 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2518 set_curr_insn_location (gimple_location (stmt));
2520 /* These flags have no purpose in RTL land. */
2521 true_edge->flags &= ~EDGE_TRUE_VALUE;
2522 false_edge->flags &= ~EDGE_FALSE_VALUE;
2524 /* We can either have a pure conditional jump with one fallthru edge or
2525 two-way jump that needs to be decomposed into two basic blocks. */
2526 if (false_edge->dest == bb->next_bb)
2528 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2529 true_edge->probability);
2530 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2531 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2532 set_curr_insn_location (true_edge->goto_locus);
2533 false_edge->flags |= EDGE_FALLTHRU;
2534 maybe_cleanup_end_of_block (false_edge, last);
2535 return NULL;
2537 if (true_edge->dest == bb->next_bb)
2539 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2540 false_edge->probability);
2541 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2542 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2543 set_curr_insn_location (false_edge->goto_locus);
2544 true_edge->flags |= EDGE_FALLTHRU;
2545 maybe_cleanup_end_of_block (true_edge, last);
2546 return NULL;
2549 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2550 true_edge->probability);
2551 last = get_last_insn ();
2552 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2553 set_curr_insn_location (false_edge->goto_locus);
2554 emit_jump (label_rtx_for_bb (false_edge->dest));
2556 BB_END (bb) = last;
2557 if (BARRIER_P (BB_END (bb)))
2558 BB_END (bb) = PREV_INSN (BB_END (bb));
2559 update_bb_for_insn (bb);
2561 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2562 dest = false_edge->dest;
2563 redirect_edge_succ (false_edge, new_bb);
2564 false_edge->flags |= EDGE_FALLTHRU;
2565 new_bb->count = false_edge->count ();
2566 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2567 add_bb_to_loop (new_bb, loop);
2568 if (loop->latch == bb
2569 && loop->header == dest)
2570 loop->latch = new_bb;
2571 make_single_succ_edge (new_bb, dest, 0);
2572 if (BARRIER_P (BB_END (new_bb)))
2573 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2574 update_bb_for_insn (new_bb);
2576 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2578 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2580 set_curr_insn_location (true_edge->goto_locus);
2581 true_edge->goto_locus = curr_insn_location ();
2584 return new_bb;
2587 /* Mark all calls that can have a transaction restart. */
2589 static void
2590 mark_transaction_restart_calls (gimple *stmt)
2592 struct tm_restart_node dummy;
2593 tm_restart_node **slot;
2595 if (!cfun->gimple_df->tm_restart)
2596 return;
2598 dummy.stmt = stmt;
2599 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2600 if (slot)
2602 struct tm_restart_node *n = *slot;
2603 tree list = n->label_or_list;
2604 rtx_insn *insn;
2606 for (insn = next_real_insn (get_last_insn ());
2607 !CALL_P (insn);
2608 insn = next_real_insn (insn))
2609 continue;
2611 if (TREE_CODE (list) == LABEL_DECL)
2612 add_reg_note (insn, REG_TM, label_rtx (list));
2613 else
2614 for (; list ; list = TREE_CHAIN (list))
2615 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2619 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2620 statement STMT. */
2622 static void
2623 expand_call_stmt (gcall *stmt)
2625 tree exp, decl, lhs;
2626 bool builtin_p;
2627 size_t i;
2629 if (gimple_call_internal_p (stmt))
2631 expand_internal_call (stmt);
2632 return;
2635 /* If this is a call to a built-in function and it has no effect other
2636 than setting the lhs, try to implement it using an internal function
2637 instead. */
2638 decl = gimple_call_fndecl (stmt);
2639 if (gimple_call_lhs (stmt)
2640 && !gimple_has_side_effects (stmt)
2641 && (optimize || (decl && called_as_built_in (decl))))
2643 internal_fn ifn = replacement_internal_fn (stmt);
2644 if (ifn != IFN_LAST)
2646 expand_internal_call (ifn, stmt);
2647 return;
2651 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2653 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2654 builtin_p = decl && fndecl_built_in_p (decl);
2656 /* If this is not a builtin function, the function type through which the
2657 call is made may be different from the type of the function. */
2658 if (!builtin_p)
2659 CALL_EXPR_FN (exp)
2660 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2661 CALL_EXPR_FN (exp));
2663 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2664 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2666 for (i = 0; i < gimple_call_num_args (stmt); i++)
2668 tree arg = gimple_call_arg (stmt, i);
2669 gimple *def;
2670 /* TER addresses into arguments of builtin functions so we have a
2671 chance to infer more correct alignment information. See PR39954. */
2672 if (builtin_p
2673 && TREE_CODE (arg) == SSA_NAME
2674 && (def = get_gimple_for_ssa_name (arg))
2675 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2676 arg = gimple_assign_rhs1 (def);
2677 CALL_EXPR_ARG (exp, i) = arg;
2680 if (gimple_has_side_effects (stmt))
2681 TREE_SIDE_EFFECTS (exp) = 1;
2683 if (gimple_call_nothrow_p (stmt))
2684 TREE_NOTHROW (exp) = 1;
2686 if (gimple_no_warning_p (stmt))
2687 TREE_NO_WARNING (exp) = 1;
2689 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2690 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2691 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2692 if (decl
2693 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2694 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2695 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2696 else
2697 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2698 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2699 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2700 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2702 /* Ensure RTL is created for debug args. */
2703 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2705 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2706 unsigned int ix;
2707 tree dtemp;
2709 if (debug_args)
2710 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2712 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2713 expand_debug_expr (dtemp);
2717 rtx_insn *before_call = get_last_insn ();
2718 lhs = gimple_call_lhs (stmt);
2719 if (lhs)
2720 expand_assignment (lhs, exp, false);
2721 else
2722 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2724 /* If the gimple call is an indirect call and has 'nocf_check'
2725 attribute find a generated CALL insn to mark it as no
2726 control-flow verification is needed. */
2727 if (gimple_call_nocf_check_p (stmt)
2728 && !gimple_call_fndecl (stmt))
2730 rtx_insn *last = get_last_insn ();
2731 while (!CALL_P (last)
2732 && last != before_call)
2733 last = PREV_INSN (last);
2735 if (last != before_call)
2736 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2739 mark_transaction_restart_calls (stmt);
2743 /* Generate RTL for an asm statement (explicit assembler code).
2744 STRING is a STRING_CST node containing the assembler code text,
2745 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2746 insn is volatile; don't optimize it. */
2748 static void
2749 expand_asm_loc (tree string, int vol, location_t locus)
2751 rtx body;
2753 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2754 ggc_strdup (TREE_STRING_POINTER (string)),
2755 locus);
2757 MEM_VOLATILE_P (body) = vol;
2759 /* Non-empty basic ASM implicitly clobbers memory. */
2760 if (TREE_STRING_LENGTH (string) != 0)
2762 rtx asm_op, clob;
2763 unsigned i, nclobbers;
2764 auto_vec<rtx> input_rvec, output_rvec;
2765 auto_vec<const char *> constraints;
2766 auto_vec<rtx> clobber_rvec;
2767 HARD_REG_SET clobbered_regs;
2768 CLEAR_HARD_REG_SET (clobbered_regs);
2770 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2771 clobber_rvec.safe_push (clob);
2773 if (targetm.md_asm_adjust)
2774 targetm.md_asm_adjust (output_rvec, input_rvec,
2775 constraints, clobber_rvec,
2776 clobbered_regs);
2778 asm_op = body;
2779 nclobbers = clobber_rvec.length ();
2780 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2782 XVECEXP (body, 0, 0) = asm_op;
2783 for (i = 0; i < nclobbers; i++)
2784 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2787 emit_insn (body);
/* Return the number of times character C occurs in string S.  S must be
   a NUL-terminated string; the terminator itself is never counted.  */
static int
n_occurrences (int c, const char *s)
{
  int n = 0;
  while (*s)
    n += (*s++ == c);
  return n;
}
2800 /* A subroutine of expand_asm_operands. Check that all operands have
2801 the same number of alternatives. Return true if so. */
2803 static bool
2804 check_operand_nalternatives (const vec<const char *> &constraints)
2806 unsigned len = constraints.length();
2807 if (len > 0)
2809 int nalternatives = n_occurrences (',', constraints[0]);
2811 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2813 error ("too many alternatives in %<asm%>");
2814 return false;
2817 for (unsigned i = 1; i < len; ++i)
2818 if (n_occurrences (',', constraints[i]) != nalternatives)
2820 error ("operand constraints for %<asm%> differ "
2821 "in number of alternatives");
2822 return false;
2825 return true;
2828 /* Check for overlap between registers marked in CLOBBERED_REGS and
2829 anything inappropriate in T. Emit error and return the register
2830 variable definition for error, NULL_TREE for ok. */
2832 static bool
2833 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2835 /* Conflicts between asm-declared register variables and the clobber
2836 list are not allowed. */
2837 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2839 if (overlap)
2841 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2842 DECL_NAME (overlap));
2844 /* Reset registerness to stop multiple errors emitted for a single
2845 variable. */
2846 DECL_REGISTER (overlap) = 0;
2847 return true;
2850 return false;
2853 /* Generate RTL for an asm statement with arguments.
2854 STRING is the instruction template.
2855 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2856 Each output or input has an expression in the TREE_VALUE and
2857 a tree list in TREE_PURPOSE which in turn contains a constraint
2858 name in TREE_VALUE (or NULL_TREE) and a constraint string
2859 in TREE_PURPOSE.
2860 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2861 that is clobbered by this insn.
2863 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2864 should be the fallthru basic block of the asm goto.
2866 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2867 Some elements of OUTPUTS may be replaced with trees representing temporary
2868 values. The caller should copy those temporary values to the originally
2869 specified lvalues.
2871 VOL nonzero means the insn is volatile; don't optimize it. */
2873 static void
2874 expand_asm_stmt (gasm *stmt)
2876 class save_input_location
2878 location_t old;
2880 public:
2881 explicit save_input_location(location_t where)
2883 old = input_location;
2884 input_location = where;
2887 ~save_input_location()
2889 input_location = old;
2893 location_t locus = gimple_location (stmt);
2895 if (gimple_asm_input_p (stmt))
2897 const char *s = gimple_asm_string (stmt);
2898 tree string = build_string (strlen (s), s);
2899 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2900 return;
2903 /* There are some legacy diagnostics in here, and this also avoids a
2904 sixth parameter to targetm.md_asm_adjust. */
2905 save_input_location s_i_l(locus);
2907 unsigned noutputs = gimple_asm_noutputs (stmt);
2908 unsigned ninputs = gimple_asm_ninputs (stmt);
2909 unsigned nlabels = gimple_asm_nlabels (stmt);
2910 unsigned i;
2912 /* ??? Diagnose during gimplification? */
2913 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2915 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2916 return;
2919 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2920 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2921 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2923 /* Copy the gimple vectors into new vectors that we can manipulate. */
2925 output_tvec.safe_grow (noutputs);
2926 input_tvec.safe_grow (ninputs);
2927 constraints.safe_grow (noutputs + ninputs);
2929 for (i = 0; i < noutputs; ++i)
2931 tree t = gimple_asm_output_op (stmt, i);
2932 output_tvec[i] = TREE_VALUE (t);
2933 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2935 for (i = 0; i < ninputs; i++)
2937 tree t = gimple_asm_input_op (stmt, i);
2938 input_tvec[i] = TREE_VALUE (t);
2939 constraints[i + noutputs]
2940 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2943 /* ??? Diagnose during gimplification? */
2944 if (! check_operand_nalternatives (constraints))
2945 return;
2947 /* Count the number of meaningful clobbered registers, ignoring what
2948 we would ignore later. */
2949 auto_vec<rtx> clobber_rvec;
2950 HARD_REG_SET clobbered_regs;
2951 CLEAR_HARD_REG_SET (clobbered_regs);
2953 if (unsigned n = gimple_asm_nclobbers (stmt))
2955 clobber_rvec.reserve (n);
2956 for (i = 0; i < n; i++)
2958 tree t = gimple_asm_clobber_op (stmt, i);
2959 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2960 int nregs, j;
2962 j = decode_reg_name_and_count (regname, &nregs);
2963 if (j < 0)
2965 if (j == -2)
2967 /* ??? Diagnose during gimplification? */
2968 error ("unknown register name %qs in %<asm%>", regname);
2970 else if (j == -4)
2972 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2973 clobber_rvec.safe_push (x);
2975 else
2977 /* Otherwise we should have -1 == empty string
2978 or -3 == cc, which is not a register. */
2979 gcc_assert (j == -1 || j == -3);
2982 else
2983 for (int reg = j; reg < j + nregs; reg++)
2985 /* Clobbering the PIC register is an error. */
2986 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2988 /* ??? Diagnose during gimplification? */
2989 error ("PIC register clobbered by %qs in %<asm%>",
2990 regname);
2991 return;
2994 SET_HARD_REG_BIT (clobbered_regs, reg);
2995 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2996 clobber_rvec.safe_push (x);
3000 unsigned nclobbers = clobber_rvec.length();
3002 /* First pass over inputs and outputs checks validity and sets
3003 mark_addressable if needed. */
3004 /* ??? Diagnose during gimplification? */
3006 for (i = 0; i < noutputs; ++i)
3008 tree val = output_tvec[i];
3009 tree type = TREE_TYPE (val);
3010 const char *constraint;
3011 bool is_inout;
3012 bool allows_reg;
3013 bool allows_mem;
3015 /* Try to parse the output constraint. If that fails, there's
3016 no point in going further. */
3017 constraint = constraints[i];
3018 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3019 &allows_mem, &allows_reg, &is_inout))
3020 return;
3022 /* If the output is a hard register, verify it doesn't conflict with
3023 any other operand's possible hard register use. */
3024 if (DECL_P (val)
3025 && REG_P (DECL_RTL (val))
3026 && HARD_REGISTER_P (DECL_RTL (val)))
3028 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3029 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3030 unsigned long match;
3032 /* Verify the other outputs do not use the same hard register. */
3033 for (j = i + 1; j < noutputs; ++j)
3034 if (DECL_P (output_tvec[j])
3035 && REG_P (DECL_RTL (output_tvec[j]))
3036 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3037 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3038 error ("invalid hard register usage between output operands");
3040 /* Verify matching constraint operands use the same hard register
3041 and that the non-matching constraint operands do not use the same
3042 hard register if the output is an early clobber operand. */
3043 for (j = 0; j < ninputs; ++j)
3044 if (DECL_P (input_tvec[j])
3045 && REG_P (DECL_RTL (input_tvec[j]))
3046 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3048 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3049 switch (*constraints[j + noutputs])
3051 case '0': case '1': case '2': case '3': case '4':
3052 case '5': case '6': case '7': case '8': case '9':
3053 match = strtoul (constraints[j + noutputs], NULL, 10);
3054 break;
3055 default:
3056 match = ULONG_MAX;
3057 break;
3059 if (i == match
3060 && output_hregno != input_hregno)
3061 error ("invalid hard register usage between output operand "
3062 "and matching constraint operand");
3063 else if (early_clobber_p
3064 && i != match
3065 && output_hregno == input_hregno)
3066 error ("invalid hard register usage between earlyclobber "
3067 "operand and input operand");
3071 if (! allows_reg
3072 && (allows_mem
3073 || is_inout
3074 || (DECL_P (val)
3075 && REG_P (DECL_RTL (val))
3076 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3077 mark_addressable (val);
3080 for (i = 0; i < ninputs; ++i)
3082 bool allows_reg, allows_mem;
3083 const char *constraint;
3085 constraint = constraints[i + noutputs];
3086 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3087 constraints.address (),
3088 &allows_mem, &allows_reg))
3089 return;
3091 if (! allows_reg && allows_mem)
3092 mark_addressable (input_tvec[i]);
3095 /* Second pass evaluates arguments. */
3097 /* Make sure stack is consistent for asm goto. */
3098 if (nlabels > 0)
3099 do_pending_stack_adjust ();
3100 int old_generating_concat_p = generating_concat_p;
3102 /* Vector of RTX's of evaluated output operands. */
3103 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3104 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3105 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3107 output_rvec.safe_grow (noutputs);
3109 for (i = 0; i < noutputs; ++i)
3111 tree val = output_tvec[i];
3112 tree type = TREE_TYPE (val);
3113 bool is_inout, allows_reg, allows_mem, ok;
3114 rtx op;
3116 ok = parse_output_constraint (&constraints[i], i, ninputs,
3117 noutputs, &allows_mem, &allows_reg,
3118 &is_inout);
3119 gcc_assert (ok);
3121 /* If an output operand is not a decl or indirect ref and our constraint
3122 allows a register, make a temporary to act as an intermediate.
3123 Make the asm insn write into that, then we will copy it to
3124 the real output operand. Likewise for promoted variables. */
3126 generating_concat_p = 0;
3128 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3129 || (DECL_P (val)
3130 && (allows_mem || REG_P (DECL_RTL (val)))
3131 && ! (REG_P (DECL_RTL (val))
3132 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3133 || ! allows_reg
3134 || is_inout
3135 || TREE_ADDRESSABLE (type))
3137 op = expand_expr (val, NULL_RTX, VOIDmode,
3138 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3139 if (MEM_P (op))
3140 op = validize_mem (op);
3142 if (! allows_reg && !MEM_P (op))
3143 error ("output number %d not directly addressable", i);
3144 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3145 || GET_CODE (op) == CONCAT)
3147 rtx old_op = op;
3148 op = gen_reg_rtx (GET_MODE (op));
3150 generating_concat_p = old_generating_concat_p;
3152 if (is_inout)
3153 emit_move_insn (op, old_op);
3155 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3156 emit_move_insn (old_op, op);
3157 after_rtl_seq = get_insns ();
3158 after_rtl_end = get_last_insn ();
3159 end_sequence ();
3162 else
3164 op = assign_temp (type, 0, 1);
3165 op = validize_mem (op);
3166 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3167 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3169 generating_concat_p = old_generating_concat_p;
3171 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3172 expand_assignment (val, make_tree (type, op), false);
3173 after_rtl_seq = get_insns ();
3174 after_rtl_end = get_last_insn ();
3175 end_sequence ();
3177 output_rvec[i] = op;
3179 if (is_inout)
3180 inout_opnum.safe_push (i);
3183 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3184 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3186 input_rvec.safe_grow (ninputs);
3187 input_mode.safe_grow (ninputs);
3189 generating_concat_p = 0;
3191 for (i = 0; i < ninputs; ++i)
3193 tree val = input_tvec[i];
3194 tree type = TREE_TYPE (val);
3195 bool allows_reg, allows_mem, ok;
3196 const char *constraint;
3197 rtx op;
3199 constraint = constraints[i + noutputs];
3200 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3201 constraints.address (),
3202 &allows_mem, &allows_reg);
3203 gcc_assert (ok);
3205 /* EXPAND_INITIALIZER will not generate code for valid initializer
3206 constants, but will still generate code for other types of operand.
3207 This is the behavior we want for constant constraints. */
3208 op = expand_expr (val, NULL_RTX, VOIDmode,
3209 allows_reg ? EXPAND_NORMAL
3210 : allows_mem ? EXPAND_MEMORY
3211 : EXPAND_INITIALIZER);
3213 /* Never pass a CONCAT to an ASM. */
3214 if (GET_CODE (op) == CONCAT)
3215 op = force_reg (GET_MODE (op), op);
3216 else if (MEM_P (op))
3217 op = validize_mem (op);
3219 if (asm_operand_ok (op, constraint, NULL) <= 0)
3221 if (allows_reg && TYPE_MODE (type) != BLKmode)
3222 op = force_reg (TYPE_MODE (type), op);
3223 else if (!allows_mem)
3224 warning (0, "asm operand %d probably doesn%'t match constraints",
3225 i + noutputs);
3226 else if (MEM_P (op))
3228 /* We won't recognize either volatile memory or memory
3229 with a queued address as a valid memory_operand
3230 at this point. Ignore it: clearly this *is* a memory. */
3232 else
3233 gcc_unreachable ();
3235 input_rvec[i] = op;
3236 input_mode[i] = TYPE_MODE (type);
3239 /* For in-out operands, copy output rtx to input rtx. */
3240 unsigned ninout = inout_opnum.length();
3241 for (i = 0; i < ninout; i++)
3243 int j = inout_opnum[i];
3244 rtx o = output_rvec[j];
3246 input_rvec.safe_push (o);
3247 input_mode.safe_push (GET_MODE (o));
3249 char buffer[16];
3250 sprintf (buffer, "%d", j);
3251 constraints.safe_push (ggc_strdup (buffer));
3253 ninputs += ninout;
3255 /* Sometimes we wish to automatically clobber registers across an asm.
3256 Case in point is when the i386 backend moved from cc0 to a hard reg --
3257 maintaining source-level compatibility means automatically clobbering
3258 the flags register. */
3259 rtx_insn *after_md_seq = NULL;
3260 if (targetm.md_asm_adjust)
3261 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3262 constraints, clobber_rvec,
3263 clobbered_regs);
3265 /* Do not allow the hook to change the output and input count,
3266 lest it mess up the operand numbering. */
3267 gcc_assert (output_rvec.length() == noutputs);
3268 gcc_assert (input_rvec.length() == ninputs);
3269 gcc_assert (constraints.length() == noutputs + ninputs);
3271 /* But it certainly can adjust the clobbers. */
3272 nclobbers = clobber_rvec.length();
3274 /* Third pass checks for easy conflicts. */
3275 /* ??? Why are we doing this on trees instead of rtx. */
3277 bool clobber_conflict_found = 0;
3278 for (i = 0; i < noutputs; ++i)
3279 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3280 clobber_conflict_found = 1;
3281 for (i = 0; i < ninputs - ninout; ++i)
3282 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3283 clobber_conflict_found = 1;
3285 /* Make vectors for the expression-rtx, constraint strings,
3286 and named operands. */
3288 rtvec argvec = rtvec_alloc (ninputs);
3289 rtvec constraintvec = rtvec_alloc (ninputs);
3290 rtvec labelvec = rtvec_alloc (nlabels);
3292 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3293 : GET_MODE (output_rvec[0])),
3294 ggc_strdup (gimple_asm_string (stmt)),
3295 "", 0, argvec, constraintvec,
3296 labelvec, locus);
3297 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3299 for (i = 0; i < ninputs; ++i)
3301 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3302 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3303 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3304 constraints[i + noutputs],
3305 locus);
3308 /* Copy labels to the vector. */
3309 rtx_code_label *fallthru_label = NULL;
3310 if (nlabels > 0)
3312 basic_block fallthru_bb = NULL;
3313 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3314 if (fallthru)
3315 fallthru_bb = fallthru->dest;
3317 for (i = 0; i < nlabels; ++i)
3319 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3320 rtx_insn *r;
3321 /* If asm goto has any labels in the fallthru basic block, use
3322 a label that we emit immediately after the asm goto. Expansion
3323 may insert further instructions into the same basic block after
3324 asm goto and if we don't do this, insertion of instructions on
3325 the fallthru edge might misbehave. See PR58670. */
3326 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3328 if (fallthru_label == NULL_RTX)
3329 fallthru_label = gen_label_rtx ();
3330 r = fallthru_label;
3332 else
3333 r = label_rtx (label);
3334 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3338 /* Now, for each output, construct an rtx
3339 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3340 ARGVEC CONSTRAINTS OPNAMES))
3341 If there is more than one, put them inside a PARALLEL. */
3343 if (nlabels > 0 && nclobbers == 0)
3345 gcc_assert (noutputs == 0);
3346 emit_jump_insn (body);
3348 else if (noutputs == 0 && nclobbers == 0)
3350 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3351 emit_insn (body);
3353 else if (noutputs == 1 && nclobbers == 0)
3355 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3356 emit_insn (gen_rtx_SET (output_rvec[0], body));
3358 else
3360 rtx obody = body;
3361 int num = noutputs;
3363 if (num == 0)
3364 num = 1;
3366 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3368 /* For each output operand, store a SET. */
3369 for (i = 0; i < noutputs; ++i)
3371 rtx src, o = output_rvec[i];
3372 if (i == 0)
3374 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3375 src = obody;
3377 else
3379 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3380 ASM_OPERANDS_TEMPLATE (obody),
3381 constraints[i], i, argvec,
3382 constraintvec, labelvec, locus);
3383 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3385 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3388 /* If there are no outputs (but there are some clobbers)
3389 store the bare ASM_OPERANDS into the PARALLEL. */
3390 if (i == 0)
3391 XVECEXP (body, 0, i++) = obody;
3393 /* Store (clobber REG) for each clobbered register specified. */
3394 for (unsigned j = 0; j < nclobbers; ++j)
3396 rtx clobbered_reg = clobber_rvec[j];
3398 /* Do sanity check for overlap between clobbers and respectively
3399 input and outputs that hasn't been handled. Such overlap
3400 should have been detected and reported above. */
3401 if (!clobber_conflict_found && REG_P (clobbered_reg))
3403 /* We test the old body (obody) contents to avoid
3404 tripping over the under-construction body. */
3405 for (unsigned k = 0; k < noutputs; ++k)
3406 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3407 internal_error ("asm clobber conflict with output operand");
3409 for (unsigned k = 0; k < ninputs - ninout; ++k)
3410 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3411 internal_error ("asm clobber conflict with input operand");
3414 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3417 if (nlabels > 0)
3418 emit_jump_insn (body);
3419 else
3420 emit_insn (body);
3423 generating_concat_p = old_generating_concat_p;
3425 if (fallthru_label)
3426 emit_label (fallthru_label);
3428 if (after_md_seq)
3429 emit_insn (after_md_seq);
3430 if (after_rtl_seq)
3431 emit_insn (after_rtl_seq);
3433 free_temp_slots ();
3434 crtl->has_asm_statement = 1;
3437 /* Emit code to jump to the address
3438 specified by the pointer expression EXP. */
3440 static void
3441 expand_computed_goto (tree exp)
3443 rtx x = expand_normal (exp);
3445 do_pending_stack_adjust ();
3446 emit_indirect_jump (x);
3449 /* Generate RTL code for a `goto' statement with target label LABEL.
3450 LABEL should be a LABEL_DECL tree node that was or will later be
3451 defined with `expand_label'. */
3453 static void
3454 expand_goto (tree label)
3456 if (flag_checking)
3458 /* Check for a nonlocal goto to a containing function. Should have
3459 gotten translated to __builtin_nonlocal_goto. */
3460 tree context = decl_function_context (label);
3461 gcc_assert (!context || context == current_function_decl);
3464 emit_jump (jump_target_rtx (label));
3467 /* Output a return with no value. */
3469 static void
3470 expand_null_return_1 (void)
3472 clear_pending_stack_adjust ();
3473 do_pending_stack_adjust ();
3474 emit_jump (return_label);
3477 /* Generate RTL to return from the current function, with no value.
3478 (That is, we do not do anything about returning any value.) */
3480 void
3481 expand_null_return (void)
3483 /* If this function was declared to return a value, but we
3484 didn't, clobber the return registers so that they are not
3485 propagated live to the rest of the function. */
3486 clobber_return_register ();
3488 expand_null_return_1 ();
3491 /* Generate RTL to return from the current function, with value VAL. */
3493 static void
3494 expand_value_return (rtx val)
3496 /* Copy the value to the return location unless it's already there. */
3498 tree decl = DECL_RESULT (current_function_decl);
3499 rtx return_reg = DECL_RTL (decl);
3500 if (return_reg != val)
3502 tree funtype = TREE_TYPE (current_function_decl);
3503 tree type = TREE_TYPE (decl);
3504 int unsignedp = TYPE_UNSIGNED (type);
3505 machine_mode old_mode = DECL_MODE (decl);
3506 machine_mode mode;
3507 if (DECL_BY_REFERENCE (decl))
3508 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3509 else
3510 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3512 if (mode != old_mode)
3513 val = convert_modes (mode, old_mode, val, unsignedp);
3515 if (GET_CODE (return_reg) == PARALLEL)
3516 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3517 else
3518 emit_move_insn (return_reg, val);
3521 expand_null_return_1 ();
3524 /* Generate RTL to evaluate the expression RETVAL and return it
3525 from the current function. */
/* RETVAL may be a bare value or a MODIFY_EXPR/INIT_EXPR storing into a
   RESULT_DECL; in the latter case only its right-hand side (RETVAL_RHS)
   is treated as the value being returned.  Cases handled, in order:
   a function whose return type is void, RETVAL == error_mark_node,
   returning the RESULT_DECL itself, a BLKmode value with a register
   return location, a non-void value with a register or PARALLEL return
   location, and everything else.
   NOTE(review): brace-only lines are absent from this listing, so the
   nesting assumed by the comments added here is inferred -- confirm
   against the upstream file.  */
3527 static void
3528 expand_return (tree retval)
3530 rtx result_rtl;
3531 rtx val = 0;
3532 tree retval_rhs;
3534 /* If function wants no value, give it none. */
3535 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
/* RETVAL is still expanded here; the resulting rtx is discarded.  */
3537 expand_normal (retval);
3538 expand_null_return ();
3539 return;
3542 if (retval == error_mark_node)
3544 /* Treat this like a return of no value from a function that
3545 returns a value. */
3546 expand_null_return ();
3547 return;
/* Strip an assignment to the RESULT_DECL down to the assigned value.  */
3549 else if ((TREE_CODE (retval) == MODIFY_EXPR
3550 || TREE_CODE (retval) == INIT_EXPR)
3551 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3552 retval_rhs = TREE_OPERAND (retval, 1);
3553 else
3554 retval_rhs = retval;
3556 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3558 /* If we are returning the RESULT_DECL, then the value has already
3559 been stored into it, so we don't have to do anything special. */
3560 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3561 expand_value_return (result_rtl);
3563 /* If the result is an aggregate that is being returned in one (or more)
3564 registers, load the registers here. */
3566 else if (retval_rhs != 0
3567 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3568 && REG_P (result_rtl))
3570 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
/* A null VAL from copy_blkmode_to_reg results in a return with no value.  */
3571 if (val)
3573 /* Use the mode of the result value on the return register. */
3574 PUT_MODE (result_rtl, GET_MODE (val));
3575 expand_value_return (val);
3577 else
3578 expand_null_return ();
3580 else if (retval_rhs != 0
3581 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3582 && (REG_P (result_rtl)
3583 || (GET_CODE (result_rtl) == PARALLEL)))
3585 /* Compute the return value into a temporary (usually a pseudo reg). */
/* NOTE(review): the target of the assignment on the next line is missing
   from this listing; presumably it is `val' -- confirm against upstream.  */
3587 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3588 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3589 val = force_not_mem (val);
3590 expand_value_return (val);
3592 else
3594 /* No hard reg used; calculate value into hard return reg. */
/* The whole RETVAL (not just RETVAL_RHS) is expanded with const0_rtx as
   target, then RESULT_RTL is returned.  */
3595 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3596 expand_value_return (result_rtl);
3600 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3601 register, tell the rtl optimizers that its value is no longer
3602 needed. */
3604 static void
3605 expand_clobber (tree lhs)
3607 if (DECL_P (lhs))
3609 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3610 if (decl_rtl && REG_P (decl_rtl))
3612 machine_mode decl_mode = GET_MODE (decl_rtl);
3613 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3614 REGMODE_NATURAL_SIZE (decl_mode)))
3615 emit_clobber (decl_rtl);
3620 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3621 STMT that doesn't require special handling for outgoing edges. That
3622 is no tailcalls and no GIMPLE_COND. */
/* Dispatches on gimple_code (STMT): gotos, labels, switches, asms, calls,
   returns and assignments each go to their own expander; GIMPLE_NOP and
   GIMPLE_PREDICT emit nothing; any other code hits gcc_unreachable.
   NOTE(review): brace-only and `;'-only lines are absent from this listing
   (e.g. the empty statements after `if (temp == target)' and after the
   emit_storent_insn test) -- confirm structure against the upstream file.  */
3624 static void
3625 expand_gimple_stmt_1 (gimple *stmt)
3627 tree op0;
/* Insns emitted below get STMT's location as the current insn location.  */
3629 set_curr_insn_location (gimple_location (stmt));
3631 switch (gimple_code (stmt))
3633 case GIMPLE_GOTO:
/* A LABEL_DECL destination is a direct goto; anything else is computed.  */
3634 op0 = gimple_goto_dest (stmt);
3635 if (TREE_CODE (op0) == LABEL_DECL)
3636 expand_goto (op0);
3637 else
3638 expand_computed_goto (op0);
3639 break;
3640 case GIMPLE_LABEL:
3641 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3642 break;
3643 case GIMPLE_NOP:
3644 case GIMPLE_PREDICT:
3645 break;
3646 case GIMPLE_SWITCH:
/* A switch with a single label (the default) is just a goto to it.  */
3648 gswitch *swtch = as_a <gswitch *> (stmt);
3649 if (gimple_switch_num_labels (swtch) == 1)
3650 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3651 else
3652 expand_case (swtch);
3654 break;
3655 case GIMPLE_ASM:
3656 expand_asm_stmt (as_a <gasm *> (stmt));
3657 break;
3658 case GIMPLE_CALL:
3659 expand_call_stmt (as_a <gcall *> (stmt));
3660 break;
3662 case GIMPLE_RETURN:
3664 op0 = gimple_return_retval (as_a <greturn *> (stmt));
/* An error_mark_node return value is passed to expand_return unchanged.  */
3666 if (op0 && op0 != error_mark_node)
3668 tree result = DECL_RESULT (current_function_decl);
3670 /* If we are not returning the current function's RESULT_DECL,
3671 build an assignment to it. */
3672 if (op0 != result)
3674 /* I believe that a function's RESULT_DECL is unique. */
3675 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3677 /* ??? We'd like to use simply expand_assignment here,
3678 but this fails if the value is of BLKmode but the return
3679 decl is a register. expand_return has special handling
3680 for this combination, which eventually should move
3681 to common code. See comments there. Until then, let's
3682 build a modify expression :-/ */
3683 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3684 result, op0);
3688 if (!op0)
3689 expand_null_return ();
3690 else
3691 expand_return (op0);
3693 break;
3695 case GIMPLE_ASSIGN:
3697 gassign *assign_stmt = as_a <gassign *> (stmt);
3698 tree lhs = gimple_assign_lhs (assign_stmt);
3700 /* Tree expand used to fiddle with |= and &= of two bitfield
3701 COMPONENT_REFs here. This can't happen with gimple, the LHS
3702 of binary assigns must be a gimple reg. */
/* First arm: the LHS is not an SSA_NAME, or the RHS is a single operand.
   The assert below requires the RHS to be a single operand either way.  */
3704 if (TREE_CODE (lhs) != SSA_NAME
3705 || get_gimple_rhs_class (gimple_expr_code (stmt))
3706 == GIMPLE_SINGLE_RHS)
3708 tree rhs = gimple_assign_rhs1 (assign_stmt);
3709 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3710 == GIMPLE_SINGLE_RHS);
3711 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3712 /* Do not put locations on possibly shared trees. */
3713 && !is_gimple_min_invariant (rhs))
3714 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3715 if (TREE_CLOBBER_P (rhs))
3716 /* This is a clobber to mark the going out of scope for
3717 this LHS. */
3718 expand_clobber (lhs);
3719 else
3720 expand_assignment (lhs, rhs,
3721 gimple_assign_nontemporal_move_p (
3722 assign_stmt));
/* Second arm: SSA_NAME LHS with a unary, binary or ternary RHS.  The
   operands are gathered into OPS and expanded with expand_expr_real_2.  */
3724 else
3726 rtx target, temp;
3727 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3728 struct separate_ops ops;
3729 bool promoted = false;
3731 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3732 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3733 promoted = true;
3735 ops.code = gimple_assign_rhs_code (assign_stmt);
3736 ops.type = TREE_TYPE (lhs);
/* The cases fall through on purpose, so a ternary RHS fills op2, op1 and
   op0, a binary RHS op1 and op0, and a unary RHS only op0.  */
3737 switch (get_gimple_rhs_class (ops.code))
3739 case GIMPLE_TERNARY_RHS:
3740 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3741 /* Fallthru */
3742 case GIMPLE_BINARY_RHS:
3743 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3744 /* Fallthru */
3745 case GIMPLE_UNARY_RHS:
3746 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3747 break;
3748 default:
3749 gcc_unreachable ();
3751 ops.location = gimple_location (stmt);
3753 /* If we want to use a nontemporal store, force the value to
3754 register first. If we store into a promoted register,
3755 don't directly expand to target. */
3756 temp = nontemporal || promoted ? NULL_RTX : target;
3757 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3758 EXPAND_NORMAL);
/* Store TEMP into TARGET unless the expansion already produced TARGET.  */
3760 if (temp == target)
3762 else if (promoted)
3764 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3765 /* If TEMP is a VOIDmode constant, use convert_modes to make
3766 sure that we properly convert it. */
3767 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3769 temp = convert_modes (GET_MODE (target),
3770 TYPE_MODE (ops.type),
3771 temp, unsignedp);
3772 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3773 GET_MODE (target), temp, unsignedp);
3776 convert_move (SUBREG_REG (target), temp, unsignedp);
/* If emit_storent_insn returns nonzero, no ordinary move is emitted.  */
3778 else if (nontemporal && emit_storent_insn (target, temp))
3780 else
3782 temp = force_operand (temp, target);
3783 if (temp != target)
3784 emit_move_insn (target, temp);
3788 break;
3790 default:
3791 gcc_unreachable ();
3795 /* Expand one gimple statement STMT and return the last RTL instruction
3796 before any of the newly generated ones.
3798 In addition to generating the necessary RTL instructions this also
3799 sets REG_EH_REGION notes if necessary and sets the current source
3800 location for diagnostics. */
3802 static rtx_insn *
3803 expand_gimple_stmt (gimple *stmt)
3805 location_t saved_location = input_location;
3806 rtx_insn *last = get_last_insn ();
3807 int lp_nr;
3809 gcc_assert (cfun);
3811 /* We need to save and restore the current source location so that errors
3812 discovered during expansion are emitted with the right location. But
3813 it would be better if the diagnostic routines used the source location
3814 embedded in the tree nodes rather than globals. */
3815 if (gimple_has_location (stmt))
3816 input_location = gimple_location (stmt);
3818 expand_gimple_stmt_1 (stmt);
3820 /* Free any temporaries used to evaluate this statement. */
3821 free_temp_slots ();
3823 input_location = saved_location;
3825 /* Mark all insns that may trap. */
3826 lp_nr = lookup_stmt_eh_lp (stmt);
3827 if (lp_nr)
3829 rtx_insn *insn;
3830 for (insn = next_real_insn (last); insn;
3831 insn = next_real_insn (insn))
3833 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3834 /* If we want exceptions for non-call insns, any
3835 may_trap_p instruction may throw. */
3836 && GET_CODE (PATTERN (insn)) != CLOBBER
3837 && GET_CODE (PATTERN (insn)) != CLOBBER_HIGH
3838 && GET_CODE (PATTERN (insn)) != USE
3839 && insn_could_throw_p (insn))
3840 make_reg_eh_region_note (insn, 0, lp_nr);
3844 return last;
3847 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3848 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3849 generated a tail call (something that might be denied by the ABI
3850 rules governing the call; see calls.c).
3852 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3853 can still reach the rest of BB. The case here is __builtin_sqrt,
3854 where the NaN result goes through the external function (with a
3855 tailcall) and the normal result happens via a sqrt instruction. */
/* When a sibcall was emitted, the value returned is BB itself, or a new
   basic block created for the insns that remain after the sibcall.
   NOTE(review): brace-only lines are absent from this listing, so the
   nesting assumed by the comments added here is inferred -- confirm
   against the upstream file.  */
3857 static basic_block
3858 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3860 rtx_insn *last2, *last;
3861 edge e;
3862 edge_iterator ei;
3863 profile_probability probability;
/* LAST2 remembers the insn preceding the new RTL; it is used for dumping.  */
3865 last2 = last = expand_gimple_stmt (stmt);
/* Search the newly emitted insns for a call marked as a sibling call.  */
3867 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3868 if (CALL_P (last) && SIBLING_CALL_P (last))
3869 goto found;
/* No sibcall was emitted: dump, report fallthru and return NULL.  */
3871 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3873 *can_fallthru = true;
3874 return NULL;
3876 found:
3877 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3878 Any instructions emitted here are about to be deleted. */
3879 do_pending_stack_adjust ();
3881 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3882 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3883 EH or abnormal edges, we shouldn't have created a tail call in
3884 the first place. So it seems to me we should just be removing
3885 all edges here, or redirecting the existing fallthru edge to
3886 the exit block. */
/* PROBABILITY sums the probabilities of the edges removed below and is
   later given to the new sibcall edge.  */
3888 probability = profile_probability::never ();
/* The iterator advances only when an edge is kept; after remove_edge the
   same position is examined again.  */
3890 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3892 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
/* The destination's count drops by the removed edge's count, except when
   the destination is the exit block.  */
3894 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3895 e->dest->count -= e->count ();
3896 probability += e->probability;
3897 remove_edge (e);
3899 else
3900 ei_next (&ei);
3903 /* This is somewhat ugly: the call_expr expander often emits instructions
3904 after the sibcall (to perform the function return). These confuse the
3905 find_many_sub_basic_blocks code, so we need to get rid of these. */
/* The insn right after the sibcall is asserted to be a barrier.  */
3906 last = NEXT_INSN (last);
3907 gcc_assert (BARRIER_P (last));
3909 *can_fallthru = false;
/* Delete everything after the barrier, stopping at the first label.  */
3910 while (NEXT_INSN (last))
3912 /* For instance an sqrt builtin expander expands if with
3913 sibcall in the then and label for `else`. */
3914 if (LABEL_P (NEXT_INSN (last)))
3916 *can_fallthru = true;
3917 break;
3919 delete_insn (NEXT_INSN (last));
/* Connect BB to the exit block with an abnormal sibcall edge and end BB
   at LAST.  */
3922 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3923 | EDGE_SIBCALL);
3924 e->probability = probability;
3925 BB_END (bb) = last;
3926 update_bb_for_insn (bb);
/* Insns remaining after LAST get a basic block of their own; a barrier at
   its end is excluded from the block.  */
3928 if (NEXT_INSN (last))
3930 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3932 last = BB_END (bb);
3933 if (BARRIER_P (last))
3934 BB_END (bb) = PREV_INSN (last);
3937 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3939 return bb;
3942 /* Return the difference between the floor and the truncated result of
3943 a signed division by OP1 with remainder MOD. */
3944 static rtx
3945 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3947 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3948 return gen_rtx_IF_THEN_ELSE
3949 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3950 gen_rtx_IF_THEN_ELSE
3951 (mode, gen_rtx_LT (BImode,
3952 gen_rtx_DIV (mode, op1, mod),
3953 const0_rtx),
3954 constm1_rtx, const0_rtx),
3955 const0_rtx);
3958 /* Return the difference between the ceil and the truncated result of
3959 a signed division by OP1 with remainder MOD. */
3960 static rtx
3961 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3963 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3964 return gen_rtx_IF_THEN_ELSE
3965 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3966 gen_rtx_IF_THEN_ELSE
3967 (mode, gen_rtx_GT (BImode,
3968 gen_rtx_DIV (mode, op1, mod),
3969 const0_rtx),
3970 const1_rtx, const0_rtx),
3971 const0_rtx);
3974 /* Return the difference between the ceil and the truncated result of
3975 an unsigned division by OP1 with remainder MOD. */
3976 static rtx
3977 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3979 /* (mod != 0 ? 1 : 0) */
3980 return gen_rtx_IF_THEN_ELSE
3981 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3982 const1_rtx, const0_rtx);
3985 /* Return the difference between the rounded and the truncated result
3986 of a signed division by OP1 with remainder MOD. Halfway cases are
3987 rounded away from zero, rather than to the nearest even number. */
3988 static rtx
3989 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3991 /* (abs (mod) >= abs (op1) - abs (mod)
3992 ? (op1 / mod > 0 ? 1 : -1)
3993 : 0) */
3994 return gen_rtx_IF_THEN_ELSE
3995 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3996 gen_rtx_MINUS (mode,
3997 gen_rtx_ABS (mode, op1),
3998 gen_rtx_ABS (mode, mod))),
3999 gen_rtx_IF_THEN_ELSE
4000 (mode, gen_rtx_GT (BImode,
4001 gen_rtx_DIV (mode, op1, mod),
4002 const0_rtx),
4003 const1_rtx, constm1_rtx),
4004 const0_rtx);
4007 /* Return the difference between the rounded and the truncated result
4008 of a unsigned division by OP1 with remainder MOD. Halfway cases
4009 are rounded away from zero, rather than to the nearest even
4010 number. */
4011 static rtx
4012 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4014 /* (mod >= op1 - mod ? 1 : 0) */
4015 return gen_rtx_IF_THEN_ELSE
4016 (mode, gen_rtx_GE (BImode, mod,
4017 gen_rtx_MINUS (mode, op1, mod)),
4018 const1_rtx, const0_rtx);
4021 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4022 any rtl. */
/* AS is the address space used for the mode checks.  The result is X
   itself, a new expression wrapping or replacing X, or NULL when the
   conversion cannot be expressed (see the end of the switch below).
   NOTE(review): brace-only lines are absent from this listing, so the
   nesting assumed by the comments added here is inferred -- confirm
   against the upstream file.  */
4024 static rtx
4025 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4026 addr_space_t as)
/* Without POINTERS_EXTEND_UNSIGNED the function only asserts that MODE
   and the mode of X are acceptable, then returns X unchanged.  */
4028 #ifndef POINTERS_EXTEND_UNSIGNED
4029 gcc_assert (mode == Pmode
4030 || mode == targetm.addr_space.address_mode (as));
4031 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4032 #else
4033 rtx temp;
4035 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
/* Nothing to do when X already has MODE or has no mode at all.  */
4037 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4038 return x;
4040 /* X must have some form of address mode already. */
4041 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
/* Narrowing takes the low part.  Widening uses ZERO_EXTEND when
   POINTERS_EXTEND_UNSIGNED is positive and SIGN_EXTEND when it is zero.
   For any other value only the specific rtx shapes handled by the switch
   below are converted.  */
4042 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4043 x = lowpart_subreg (mode, x, xmode);
4044 else if (POINTERS_EXTEND_UNSIGNED > 0)
4045 x = gen_rtx_ZERO_EXTEND (mode, x);
4046 else if (!POINTERS_EXTEND_UNSIGNED)
4047 x = gen_rtx_SIGN_EXTEND (mode, x);
4048 else
4050 switch (GET_CODE (x))
4052 case SUBREG:
/* A SUBREG whose inner expression already has MODE is replaced by that
   inner expression, provided one of the three conditions below holds.  */
4053 if ((SUBREG_PROMOTED_VAR_P (x)
4054 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4055 || (GET_CODE (SUBREG_REG (x)) == PLUS
4056 && REG_P (XEXP (SUBREG_REG (x), 0))
4057 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4058 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4059 && GET_MODE (SUBREG_REG (x)) == mode)
4060 return SUBREG_REG (x);
4061 break;
4062 case LABEL_REF:
/* Rebuild the LABEL_REF in MODE, carrying over the nonlocal flag.  */
4063 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4064 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4065 return temp;
4066 case SYMBOL_REF:
/* A shallow copy is made so the original SYMBOL_REF keeps its mode.  */
4067 temp = shallow_copy_rtx (x);
4068 PUT_MODE (temp, mode);
4069 return temp;
4070 case CONST:
/* Convert the wrapped expression recursively; a NULL result propagates.  */
4071 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4072 if (temp)
4073 temp = gen_rtx_CONST (mode, temp);
4074 return temp;
4075 case PLUS:
4076 case MINUS:
/* Only the first operand is converted, and only when the second is a
   CONST_INT; the second operand is reused as is.  */
4077 if (CONST_INT_P (XEXP (x, 1)))
4079 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4080 if (temp)
4081 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4083 break;
4084 default:
4085 break;
4087 /* Don't know how to express ptr_extend as operation in debug info. */
4088 return NULL;
4090 #endif /* POINTERS_EXTEND_UNSIGNED */
4092 return x;
4095 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4096 by avoid_deep_ter_for_debug. */
/* The map is allocated on demand by avoid_deep_ter_for_debug the first
   time it needs to record an entry.  */
4098 static hash_map<tree, tree> *deep_ter_debug_map;
4100 /* Split too deep TER chains for debug stmts using debug temporaries. */
4102 static void
4103 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4105 use_operand_p use_p;
4106 ssa_op_iter iter;
4107 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4109 tree use = USE_FROM_PTR (use_p);
4110 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4111 continue;
4112 gimple *g = get_gimple_for_ssa_name (use);
4113 if (g == NULL)
4114 continue;
4115 if (depth > 6 && !stmt_ends_bb_p (g))
4117 if (deep_ter_debug_map == NULL)
4118 deep_ter_debug_map = new hash_map<tree, tree>;
4120 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4121 if (vexpr != NULL)
4122 continue;
4123 vexpr = make_node (DEBUG_EXPR_DECL);
4124 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4125 DECL_ARTIFICIAL (vexpr) = 1;
4126 TREE_TYPE (vexpr) = TREE_TYPE (use);
4127 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4128 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4129 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4130 avoid_deep_ter_for_debug (def_temp, 0);
4132 else
4133 avoid_deep_ter_for_debug (g, depth + 1);
4137 /* Return an RTX equivalent to the value of the parameter DECL. */
4139 static rtx
4140 expand_debug_parm_decl (tree decl)
4142 rtx incoming = DECL_INCOMING_RTL (decl);
4144 if (incoming
4145 && GET_MODE (incoming) != BLKmode
4146 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4147 || (MEM_P (incoming)
4148 && REG_P (XEXP (incoming, 0))
4149 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4151 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4153 #ifdef HAVE_window_save
4154 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4155 If the target machine has an explicit window save instruction, the
4156 actual entry value is the corresponding OUTGOING_REGNO instead. */
4157 if (REG_P (incoming)
4158 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4159 incoming
4160 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4161 OUTGOING_REGNO (REGNO (incoming)), 0);
4162 else if (MEM_P (incoming))
4164 rtx reg = XEXP (incoming, 0);
4165 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4167 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4168 incoming = replace_equiv_address_nv (incoming, reg);
4170 else
4171 incoming = copy_rtx (incoming);
4173 #endif
4175 ENTRY_VALUE_EXP (rtl) = incoming;
4176 return rtl;
4179 if (incoming
4180 && GET_MODE (incoming) != BLKmode
4181 && !TREE_ADDRESSABLE (decl)
4182 && MEM_P (incoming)
4183 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4184 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4185 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4186 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4187 return copy_rtx (incoming);
4189 return NULL_RTX;
4192 /* Return an RTX equivalent to the value of the tree expression EXP. */
4194 static rtx
4195 expand_debug_expr (tree exp)
4197 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4198 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4199 machine_mode inner_mode = VOIDmode;
4200 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4201 addr_space_t as;
4202 scalar_int_mode op0_mode, op1_mode, addr_mode;
4204 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4206 case tcc_expression:
4207 switch (TREE_CODE (exp))
4209 case COND_EXPR:
4210 case DOT_PROD_EXPR:
4211 case SAD_EXPR:
4212 case WIDEN_MULT_PLUS_EXPR:
4213 case WIDEN_MULT_MINUS_EXPR:
4214 goto ternary;
4216 case TRUTH_ANDIF_EXPR:
4217 case TRUTH_ORIF_EXPR:
4218 case TRUTH_AND_EXPR:
4219 case TRUTH_OR_EXPR:
4220 case TRUTH_XOR_EXPR:
4221 goto binary;
4223 case TRUTH_NOT_EXPR:
4224 goto unary;
4226 default:
4227 break;
4229 break;
4231 ternary:
4232 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4233 if (!op2)
4234 return NULL_RTX;
4235 /* Fall through. */
4237 binary:
4238 case tcc_binary:
4239 if (mode == BLKmode)
4240 return NULL_RTX;
4241 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4242 if (!op1)
4243 return NULL_RTX;
4244 switch (TREE_CODE (exp))
4246 case LSHIFT_EXPR:
4247 case RSHIFT_EXPR:
4248 case LROTATE_EXPR:
4249 case RROTATE_EXPR:
4250 case WIDEN_LSHIFT_EXPR:
4251 /* Ensure second operand isn't wider than the first one. */
4252 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4253 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4254 && (GET_MODE_UNIT_PRECISION (mode)
4255 < GET_MODE_PRECISION (op1_mode)))
4256 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4257 break;
4258 default:
4259 break;
4261 /* Fall through. */
4263 unary:
4264 case tcc_unary:
4265 if (mode == BLKmode)
4266 return NULL_RTX;
4267 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4268 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4269 if (!op0)
4270 return NULL_RTX;
4271 break;
4273 case tcc_comparison:
4274 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4275 goto binary;
4277 case tcc_type:
4278 case tcc_statement:
4279 gcc_unreachable ();
4281 case tcc_constant:
4282 case tcc_exceptional:
4283 case tcc_declaration:
4284 case tcc_reference:
4285 case tcc_vl_exp:
4286 break;
4289 switch (TREE_CODE (exp))
4291 case STRING_CST:
4292 if (!lookup_constant_def (exp))
4294 if (strlen (TREE_STRING_POINTER (exp)) + 1
4295 != (size_t) TREE_STRING_LENGTH (exp))
4296 return NULL_RTX;
4297 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4298 op0 = gen_rtx_MEM (BLKmode, op0);
4299 set_mem_attributes (op0, exp, 0);
4300 return op0;
4302 /* Fall through. */
4304 case INTEGER_CST:
4305 case REAL_CST:
4306 case FIXED_CST:
4307 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4308 return op0;
4310 case POLY_INT_CST:
4311 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4313 case COMPLEX_CST:
4314 gcc_assert (COMPLEX_MODE_P (mode));
4315 op0 = expand_debug_expr (TREE_REALPART (exp));
4316 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4317 return gen_rtx_CONCAT (mode, op0, op1);
4319 case DEBUG_EXPR_DECL:
4320 op0 = DECL_RTL_IF_SET (exp);
4322 if (op0)
4323 return op0;
4325 op0 = gen_rtx_DEBUG_EXPR (mode);
4326 DEBUG_EXPR_TREE_DECL (op0) = exp;
4327 SET_DECL_RTL (exp, op0);
4329 return op0;
4331 case VAR_DECL:
4332 case PARM_DECL:
4333 case FUNCTION_DECL:
4334 case LABEL_DECL:
4335 case CONST_DECL:
4336 case RESULT_DECL:
4337 op0 = DECL_RTL_IF_SET (exp);
4339 /* This decl was probably optimized away. */
4340 if (!op0)
4342 if (!VAR_P (exp)
4343 || DECL_EXTERNAL (exp)
4344 || !TREE_STATIC (exp)
4345 || !DECL_NAME (exp)
4346 || DECL_HARD_REGISTER (exp)
4347 || DECL_IN_CONSTANT_POOL (exp)
4348 || mode == VOIDmode)
4349 return NULL;
4351 op0 = make_decl_rtl_for_debug (exp);
4352 if (!MEM_P (op0)
4353 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4354 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4355 return NULL;
4357 else
4358 op0 = copy_rtx (op0);
4360 if (GET_MODE (op0) == BLKmode
4361 /* If op0 is not BLKmode, but mode is, adjust_mode
4362 below would ICE. While it is likely a FE bug,
4363 try to be robust here. See PR43166. */
4364 || mode == BLKmode
4365 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4367 gcc_assert (MEM_P (op0));
4368 op0 = adjust_address_nv (op0, mode, 0);
4369 return op0;
4372 /* Fall through. */
4374 adjust_mode:
4375 case PAREN_EXPR:
4376 CASE_CONVERT:
4378 inner_mode = GET_MODE (op0);
4380 if (mode == inner_mode)
4381 return op0;
4383 if (inner_mode == VOIDmode)
4385 if (TREE_CODE (exp) == SSA_NAME)
4386 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4387 else
4388 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4389 if (mode == inner_mode)
4390 return op0;
4393 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4395 if (GET_MODE_UNIT_BITSIZE (mode)
4396 == GET_MODE_UNIT_BITSIZE (inner_mode))
4397 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4398 else if (GET_MODE_UNIT_BITSIZE (mode)
4399 < GET_MODE_UNIT_BITSIZE (inner_mode))
4400 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4401 else
4402 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4404 else if (FLOAT_MODE_P (mode))
4406 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4407 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4408 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4409 else
4410 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4412 else if (FLOAT_MODE_P (inner_mode))
4414 if (unsignedp)
4415 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4416 else
4417 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4419 else if (GET_MODE_UNIT_PRECISION (mode)
4420 == GET_MODE_UNIT_PRECISION (inner_mode))
4421 op0 = lowpart_subreg (mode, op0, inner_mode);
4422 else if (GET_MODE_UNIT_PRECISION (mode)
4423 < GET_MODE_UNIT_PRECISION (inner_mode))
4424 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4425 else if (UNARY_CLASS_P (exp)
4426 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4427 : unsignedp)
4428 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4429 else
4430 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4432 return op0;
4435 case MEM_REF:
4436 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4438 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4439 TREE_OPERAND (exp, 0),
4440 TREE_OPERAND (exp, 1));
4441 if (newexp)
4442 return expand_debug_expr (newexp);
4444 /* FALLTHROUGH */
4445 case INDIRECT_REF:
4446 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4447 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4448 if (!op0)
4449 return NULL;
4451 if (TREE_CODE (exp) == MEM_REF)
4453 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4454 || (GET_CODE (op0) == PLUS
4455 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4456 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4457 Instead just use get_inner_reference. */
4458 goto component_ref;
4460 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4461 poly_int64 offset;
4462 if (!op1 || !poly_int_rtx_p (op1, &offset))
4463 return NULL;
4465 op0 = plus_constant (inner_mode, op0, offset);
4468 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4470 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4471 op0, as);
4472 if (op0 == NULL_RTX)
4473 return NULL;
4475 op0 = gen_rtx_MEM (mode, op0);
4476 set_mem_attributes (op0, exp, 0);
4477 if (TREE_CODE (exp) == MEM_REF
4478 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4479 set_mem_expr (op0, NULL_TREE);
4480 set_mem_addr_space (op0, as);
4482 return op0;
4484 case TARGET_MEM_REF:
4485 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4486 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4487 return NULL;
4489 op0 = expand_debug_expr
4490 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4491 if (!op0)
4492 return NULL;
4494 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4495 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4496 op0, as);
4497 if (op0 == NULL_RTX)
4498 return NULL;
4500 op0 = gen_rtx_MEM (mode, op0);
4502 set_mem_attributes (op0, exp, 0);
4503 set_mem_addr_space (op0, as);
4505 return op0;
4507 component_ref:
4508 case ARRAY_REF:
4509 case ARRAY_RANGE_REF:
4510 case COMPONENT_REF:
4511 case BIT_FIELD_REF:
4512 case REALPART_EXPR:
4513 case IMAGPART_EXPR:
4514 case VIEW_CONVERT_EXPR:
4516 machine_mode mode1;
4517 poly_int64 bitsize, bitpos;
4518 tree offset;
4519 int reversep, volatilep = 0;
4520 tree tem
4521 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4522 &unsignedp, &reversep, &volatilep);
4523 rtx orig_op0;
4525 if (known_eq (bitsize, 0))
4526 return NULL;
4528 orig_op0 = op0 = expand_debug_expr (tem);
4530 if (!op0)
4531 return NULL;
4533 if (offset)
4535 machine_mode addrmode, offmode;
4537 if (!MEM_P (op0))
4538 return NULL;
4540 op0 = XEXP (op0, 0);
4541 addrmode = GET_MODE (op0);
4542 if (addrmode == VOIDmode)
4543 addrmode = Pmode;
4545 op1 = expand_debug_expr (offset);
4546 if (!op1)
4547 return NULL;
4549 offmode = GET_MODE (op1);
4550 if (offmode == VOIDmode)
4551 offmode = TYPE_MODE (TREE_TYPE (offset));
4553 if (addrmode != offmode)
4554 op1 = lowpart_subreg (addrmode, op1, offmode);
4556 /* Don't use offset_address here, we don't need a
4557 recognizable address, and we don't want to generate
4558 code. */
4559 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4560 op0, op1));
4563 if (MEM_P (op0))
4565 if (mode1 == VOIDmode)
4567 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4568 return NULL;
4569 /* Bitfield. */
4570 mode1 = smallest_int_mode_for_size (bitsize);
4572 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4573 if (maybe_ne (bytepos, 0))
4575 op0 = adjust_address_nv (op0, mode1, bytepos);
4576 bitpos = num_trailing_bits (bitpos);
4578 else if (known_eq (bitpos, 0)
4579 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4580 op0 = adjust_address_nv (op0, mode, 0);
4581 else if (GET_MODE (op0) != mode1)
4582 op0 = adjust_address_nv (op0, mode1, 0);
4583 else
4584 op0 = copy_rtx (op0);
4585 if (op0 == orig_op0)
4586 op0 = shallow_copy_rtx (op0);
4587 set_mem_attributes (op0, exp, 0);
4590 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4591 return op0;
4593 if (maybe_lt (bitpos, 0))
4594 return NULL;
4596 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4597 return NULL;
4599 poly_int64 bytepos;
4600 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4601 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4603 machine_mode opmode = GET_MODE (op0);
4605 if (opmode == VOIDmode)
4606 opmode = TYPE_MODE (TREE_TYPE (tem));
4608 /* This condition may hold if we're expanding the address
4609 right past the end of an array that turned out not to
4610 be addressable (i.e., the address was only computed in
4611 debug stmts). The gen_subreg below would rightfully
4612 crash, and the address doesn't really exist, so just
4613 drop it. */
4614 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4615 return NULL;
4617 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4618 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4621 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4622 && TYPE_UNSIGNED (TREE_TYPE (exp))
4623 ? SIGN_EXTRACT
4624 : ZERO_EXTRACT, mode,
4625 GET_MODE (op0) != VOIDmode
4626 ? GET_MODE (op0)
4627 : TYPE_MODE (TREE_TYPE (tem)),
4628 op0, gen_int_mode (bitsize, word_mode),
4629 gen_int_mode (bitpos, word_mode));
4632 case ABS_EXPR:
4633 case ABSU_EXPR:
4634 return simplify_gen_unary (ABS, mode, op0, mode);
4636 case NEGATE_EXPR:
4637 return simplify_gen_unary (NEG, mode, op0, mode);
4639 case BIT_NOT_EXPR:
4640 return simplify_gen_unary (NOT, mode, op0, mode);
4642 case FLOAT_EXPR:
4643 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4644 0)))
4645 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4646 inner_mode);
4648 case FIX_TRUNC_EXPR:
4649 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4650 inner_mode);
4652 case POINTER_PLUS_EXPR:
4653 /* For the rare target where pointers are not the same size as
4654 size_t, we need to check for mis-matched modes and correct
4655 the addend. */
4656 if (op0 && op1
4657 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4658 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4659 && op0_mode != op1_mode)
4661 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4662 /* If OP0 is a partial mode, then we must truncate, even
4663 if it has the same bitsize as OP1 as GCC's
4664 representation of partial modes is opaque. */
4665 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4666 && (GET_MODE_BITSIZE (op0_mode)
4667 == GET_MODE_BITSIZE (op1_mode))))
4668 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4669 else
4670 /* We always sign-extend, regardless of the signedness of
4671 the operand, because the operand is always unsigned
4672 here even if the original C expression is signed. */
4673 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4675 /* Fall through. */
4676 case PLUS_EXPR:
4677 return simplify_gen_binary (PLUS, mode, op0, op1);
4679 case MINUS_EXPR:
4680 case POINTER_DIFF_EXPR:
4681 return simplify_gen_binary (MINUS, mode, op0, op1);
4683 case MULT_EXPR:
4684 return simplify_gen_binary (MULT, mode, op0, op1);
4686 case RDIV_EXPR:
4687 case TRUNC_DIV_EXPR:
4688 case EXACT_DIV_EXPR:
4689 if (unsignedp)
4690 return simplify_gen_binary (UDIV, mode, op0, op1);
4691 else
4692 return simplify_gen_binary (DIV, mode, op0, op1);
4694 case TRUNC_MOD_EXPR:
4695 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4697 case FLOOR_DIV_EXPR:
4698 if (unsignedp)
4699 return simplify_gen_binary (UDIV, mode, op0, op1);
4700 else
4702 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4703 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4704 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4705 return simplify_gen_binary (PLUS, mode, div, adj);
4708 case FLOOR_MOD_EXPR:
4709 if (unsignedp)
4710 return simplify_gen_binary (UMOD, mode, op0, op1);
4711 else
4713 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4714 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4715 adj = simplify_gen_unary (NEG, mode,
4716 simplify_gen_binary (MULT, mode, adj, op1),
4717 mode);
4718 return simplify_gen_binary (PLUS, mode, mod, adj);
4721 case CEIL_DIV_EXPR:
4722 if (unsignedp)
4724 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4725 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4726 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4727 return simplify_gen_binary (PLUS, mode, div, adj);
4729 else
4731 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4732 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4733 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4734 return simplify_gen_binary (PLUS, mode, div, adj);
4737 case CEIL_MOD_EXPR:
4738 if (unsignedp)
4740 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4741 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4742 adj = simplify_gen_unary (NEG, mode,
4743 simplify_gen_binary (MULT, mode, adj, op1),
4744 mode);
4745 return simplify_gen_binary (PLUS, mode, mod, adj);
4747 else
4749 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4750 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4751 adj = simplify_gen_unary (NEG, mode,
4752 simplify_gen_binary (MULT, mode, adj, op1),
4753 mode);
4754 return simplify_gen_binary (PLUS, mode, mod, adj);
4757 case ROUND_DIV_EXPR:
4758 if (unsignedp)
4760 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4761 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4762 rtx adj = round_udiv_adjust (mode, mod, op1);
4763 return simplify_gen_binary (PLUS, mode, div, adj);
4765 else
4767 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4768 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4769 rtx adj = round_sdiv_adjust (mode, mod, op1);
4770 return simplify_gen_binary (PLUS, mode, div, adj);
4773 case ROUND_MOD_EXPR:
4774 if (unsignedp)
4776 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4777 rtx adj = round_udiv_adjust (mode, mod, op1);
4778 adj = simplify_gen_unary (NEG, mode,
4779 simplify_gen_binary (MULT, mode, adj, op1),
4780 mode);
4781 return simplify_gen_binary (PLUS, mode, mod, adj);
4783 else
4785 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4786 rtx adj = round_sdiv_adjust (mode, mod, op1);
4787 adj = simplify_gen_unary (NEG, mode,
4788 simplify_gen_binary (MULT, mode, adj, op1),
4789 mode);
4790 return simplify_gen_binary (PLUS, mode, mod, adj);
4793 case LSHIFT_EXPR:
4794 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4796 case RSHIFT_EXPR:
4797 if (unsignedp)
4798 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4799 else
4800 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4802 case LROTATE_EXPR:
4803 return simplify_gen_binary (ROTATE, mode, op0, op1);
4805 case RROTATE_EXPR:
4806 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4808 case MIN_EXPR:
4809 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4811 case MAX_EXPR:
4812 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4814 case BIT_AND_EXPR:
4815 case TRUTH_AND_EXPR:
4816 return simplify_gen_binary (AND, mode, op0, op1);
4818 case BIT_IOR_EXPR:
4819 case TRUTH_OR_EXPR:
4820 return simplify_gen_binary (IOR, mode, op0, op1);
4822 case BIT_XOR_EXPR:
4823 case TRUTH_XOR_EXPR:
4824 return simplify_gen_binary (XOR, mode, op0, op1);
4826 case TRUTH_ANDIF_EXPR:
4827 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4829 case TRUTH_ORIF_EXPR:
4830 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4832 case TRUTH_NOT_EXPR:
4833 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4835 case LT_EXPR:
4836 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4837 op0, op1);
4839 case LE_EXPR:
4840 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4841 op0, op1);
4843 case GT_EXPR:
4844 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4845 op0, op1);
4847 case GE_EXPR:
4848 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4849 op0, op1);
4851 case EQ_EXPR:
4852 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4854 case NE_EXPR:
4855 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4857 case UNORDERED_EXPR:
4858 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4860 case ORDERED_EXPR:
4861 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4863 case UNLT_EXPR:
4864 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4866 case UNLE_EXPR:
4867 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4869 case UNGT_EXPR:
4870 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4872 case UNGE_EXPR:
4873 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4875 case UNEQ_EXPR:
4876 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4878 case LTGT_EXPR:
4879 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4881 case COND_EXPR:
4882 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4884 case COMPLEX_EXPR:
4885 gcc_assert (COMPLEX_MODE_P (mode));
4886 if (GET_MODE (op0) == VOIDmode)
4887 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4888 if (GET_MODE (op1) == VOIDmode)
4889 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4890 return gen_rtx_CONCAT (mode, op0, op1);
4892 case CONJ_EXPR:
4893 if (GET_CODE (op0) == CONCAT)
4894 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4895 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4896 XEXP (op0, 1),
4897 GET_MODE_INNER (mode)));
4898 else
4900 scalar_mode imode = GET_MODE_INNER (mode);
4901 rtx re, im;
4903 if (MEM_P (op0))
4905 re = adjust_address_nv (op0, imode, 0);
4906 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4908 else
4910 scalar_int_mode ifmode;
4911 scalar_int_mode ihmode;
4912 rtx halfsize;
4913 if (!int_mode_for_mode (mode).exists (&ifmode)
4914 || !int_mode_for_mode (imode).exists (&ihmode))
4915 return NULL;
4916 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4917 re = op0;
4918 if (mode != ifmode)
4919 re = gen_rtx_SUBREG (ifmode, re, 0);
4920 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4921 if (imode != ihmode)
4922 re = gen_rtx_SUBREG (imode, re, 0);
4923 im = copy_rtx (op0);
4924 if (mode != ifmode)
4925 im = gen_rtx_SUBREG (ifmode, im, 0);
4926 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4927 if (imode != ihmode)
4928 im = gen_rtx_SUBREG (imode, im, 0);
4930 im = gen_rtx_NEG (imode, im);
4931 return gen_rtx_CONCAT (mode, re, im);
4934 case ADDR_EXPR:
4935 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4936 if (!op0 || !MEM_P (op0))
4938 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4939 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4940 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4941 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4942 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4943 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4945 if (handled_component_p (TREE_OPERAND (exp, 0)))
4947 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
4948 bool reverse;
4949 tree decl
4950 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
4951 &bitsize, &maxsize, &reverse);
4952 if ((VAR_P (decl)
4953 || TREE_CODE (decl) == PARM_DECL
4954 || TREE_CODE (decl) == RESULT_DECL)
4955 && (!TREE_ADDRESSABLE (decl)
4956 || target_for_debug_bind (decl))
4957 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
4958 && known_gt (bitsize, 0)
4959 && known_eq (bitsize, maxsize))
4961 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4962 return plus_constant (mode, base, byteoffset);
4966 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4967 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4968 == ADDR_EXPR)
4970 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4971 0));
4972 if (op0 != NULL
4973 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4974 || (GET_CODE (op0) == PLUS
4975 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4976 && CONST_INT_P (XEXP (op0, 1)))))
4978 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4979 1));
4980 poly_int64 offset;
4981 if (!op1 || !poly_int_rtx_p (op1, &offset))
4982 return NULL;
4984 return plus_constant (mode, op0, offset);
4988 return NULL;
4991 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4992 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
4993 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
4995 return op0;
4997 case VECTOR_CST:
4999 unsigned HOST_WIDE_INT i, nelts;
5001 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5002 return NULL;
5004 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5006 for (i = 0; i < nelts; ++i)
5008 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5009 if (!op1)
5010 return NULL;
5011 XVECEXP (op0, 0, i) = op1;
5014 return op0;
5017 case CONSTRUCTOR:
5018 if (TREE_CLOBBER_P (exp))
5019 return NULL;
5020 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5022 unsigned i;
5023 unsigned HOST_WIDE_INT nelts;
5024 tree val;
5026 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5027 goto flag_unsupported;
5029 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5031 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5033 op1 = expand_debug_expr (val);
5034 if (!op1)
5035 return NULL;
5036 XVECEXP (op0, 0, i) = op1;
5039 if (i < nelts)
5041 op1 = expand_debug_expr
5042 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5044 if (!op1)
5045 return NULL;
5047 for (; i < nelts; i++)
5048 XVECEXP (op0, 0, i) = op1;
5051 return op0;
5053 else
5054 goto flag_unsupported;
5056 case CALL_EXPR:
5057 /* ??? Maybe handle some builtins? */
5058 return NULL;
5060 case SSA_NAME:
5062 gimple *g = get_gimple_for_ssa_name (exp);
5063 if (g)
5065 tree t = NULL_TREE;
5066 if (deep_ter_debug_map)
5068 tree *slot = deep_ter_debug_map->get (exp);
5069 if (slot)
5070 t = *slot;
5072 if (t == NULL_TREE)
5073 t = gimple_assign_rhs_to_tree (g);
5074 op0 = expand_debug_expr (t);
5075 if (!op0)
5076 return NULL;
5078 else
5080 /* If this is a reference to an incoming value of
5081 parameter that is never used in the code or where the
5082 incoming value is never used in the code, use
5083 PARM_DECL's DECL_RTL if set. */
5084 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5085 && SSA_NAME_VAR (exp)
5086 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5087 && has_zero_uses (exp))
5089 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5090 if (op0)
5091 goto adjust_mode;
5092 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5093 if (op0)
5094 goto adjust_mode;
5097 int part = var_to_partition (SA.map, exp);
5099 if (part == NO_PARTITION)
5100 return NULL;
5102 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5104 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5106 goto adjust_mode;
5109 case ERROR_MARK:
5110 return NULL;
5112 /* Vector stuff. For most of the codes we don't have rtl codes. */
5113 case REALIGN_LOAD_EXPR:
5114 case VEC_COND_EXPR:
5115 case VEC_PACK_FIX_TRUNC_EXPR:
5116 case VEC_PACK_FLOAT_EXPR:
5117 case VEC_PACK_SAT_EXPR:
5118 case VEC_PACK_TRUNC_EXPR:
5119 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5120 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5121 case VEC_UNPACK_FLOAT_HI_EXPR:
5122 case VEC_UNPACK_FLOAT_LO_EXPR:
5123 case VEC_UNPACK_HI_EXPR:
5124 case VEC_UNPACK_LO_EXPR:
5125 case VEC_WIDEN_MULT_HI_EXPR:
5126 case VEC_WIDEN_MULT_LO_EXPR:
5127 case VEC_WIDEN_MULT_EVEN_EXPR:
5128 case VEC_WIDEN_MULT_ODD_EXPR:
5129 case VEC_WIDEN_LSHIFT_HI_EXPR:
5130 case VEC_WIDEN_LSHIFT_LO_EXPR:
5131 case VEC_PERM_EXPR:
5132 case VEC_DUPLICATE_EXPR:
5133 case VEC_SERIES_EXPR:
5134 return NULL;
5136 /* Misc codes. */
5137 case ADDR_SPACE_CONVERT_EXPR:
5138 case FIXED_CONVERT_EXPR:
5139 case OBJ_TYPE_REF:
5140 case WITH_SIZE_EXPR:
5141 case BIT_INSERT_EXPR:
5142 return NULL;
5144 case DOT_PROD_EXPR:
5145 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5146 && SCALAR_INT_MODE_P (mode))
5149 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5150 0)))
5151 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5152 inner_mode);
5154 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5155 1)))
5156 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5157 inner_mode);
5158 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5159 return simplify_gen_binary (PLUS, mode, op0, op2);
5161 return NULL;
5163 case WIDEN_MULT_EXPR:
5164 case WIDEN_MULT_PLUS_EXPR:
5165 case WIDEN_MULT_MINUS_EXPR:
5166 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5167 && SCALAR_INT_MODE_P (mode))
5169 inner_mode = GET_MODE (op0);
5170 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5171 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5172 else
5173 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5174 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5175 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5176 else
5177 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5178 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5179 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5180 return op0;
5181 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5182 return simplify_gen_binary (PLUS, mode, op0, op2);
5183 else
5184 return simplify_gen_binary (MINUS, mode, op2, op0);
5186 return NULL;
5188 case MULT_HIGHPART_EXPR:
5189 /* ??? Similar to the above. */
5190 return NULL;
5192 case WIDEN_SUM_EXPR:
5193 case WIDEN_LSHIFT_EXPR:
5194 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5195 && SCALAR_INT_MODE_P (mode))
5198 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5199 0)))
5200 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5201 inner_mode);
5202 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5203 ? ASHIFT : PLUS, mode, op0, op1);
5205 return NULL;
5207 default:
5208 flag_unsupported:
5209 if (flag_checking)
5211 debug_tree (exp);
5212 gcc_unreachable ();
5214 return NULL;
5218 /* Return an RTX equivalent to the source bind value of the tree expression
5219 EXP. */
5221 static rtx
5222 expand_debug_source_expr (tree exp)
5224 rtx op0 = NULL_RTX;
5225 machine_mode mode = VOIDmode, inner_mode;
5227 switch (TREE_CODE (exp))
5229 case VAR_DECL:
5230 if (DECL_ABSTRACT_ORIGIN (exp))
5231 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5232 break;
5233 case PARM_DECL:
5235 mode = DECL_MODE (exp);
5236 op0 = expand_debug_parm_decl (exp);
5237 if (op0)
5238 break;
5239 /* See if this isn't an argument that has been completely
5240 optimized out. */
5241 if (!DECL_RTL_SET_P (exp)
5242 && !DECL_INCOMING_RTL (exp)
5243 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5245 tree aexp = DECL_ORIGIN (exp);
5246 if (DECL_CONTEXT (aexp)
5247 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5249 vec<tree, va_gc> **debug_args;
5250 unsigned int ix;
5251 tree ddecl;
5252 debug_args = decl_debug_args_lookup (current_function_decl);
5253 if (debug_args != NULL)
5255 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5256 ix += 2)
5257 if (ddecl == aexp)
5258 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5262 break;
5264 default:
5265 break;
5268 if (op0 == NULL_RTX)
5269 return NULL_RTX;
5271 inner_mode = GET_MODE (op0);
5272 if (mode == inner_mode)
5273 return op0;
5275 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5277 if (GET_MODE_UNIT_BITSIZE (mode)
5278 == GET_MODE_UNIT_BITSIZE (inner_mode))
5279 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5280 else if (GET_MODE_UNIT_BITSIZE (mode)
5281 < GET_MODE_UNIT_BITSIZE (inner_mode))
5282 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5283 else
5284 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5286 else if (FLOAT_MODE_P (mode))
5287 gcc_unreachable ();
5288 else if (FLOAT_MODE_P (inner_mode))
5290 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5291 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5292 else
5293 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5295 else if (GET_MODE_UNIT_PRECISION (mode)
5296 == GET_MODE_UNIT_PRECISION (inner_mode))
5297 op0 = lowpart_subreg (mode, op0, inner_mode);
5298 else if (GET_MODE_UNIT_PRECISION (mode)
5299 < GET_MODE_UNIT_PRECISION (inner_mode))
5300 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5301 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5302 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5303 else
5304 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5306 return op0;
5309 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5310 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5311 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5313 static void
5314 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5316 rtx exp = *exp_p;
5318 if (exp == NULL_RTX)
5319 return;
5321 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5322 return;
5324 if (depth == 4)
5326 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5327 rtx dval = make_debug_expr_from_rtl (exp);
5329 /* Emit a debug bind insn before INSN. */
5330 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5331 DEBUG_EXPR_TREE_DECL (dval), exp,
5332 VAR_INIT_STATUS_INITIALIZED);
5334 emit_debug_insn_before (bind, insn);
5335 *exp_p = dval;
5336 return;
5339 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5340 int i, j;
5341 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5342 switch (*format_ptr++)
5344 case 'e':
5345 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5346 break;
5348 case 'E':
5349 case 'V':
5350 for (j = 0; j < XVECLEN (exp, i); j++)
5351 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5352 break;
5354 default:
5355 break;
5359 /* Expand the _LOCs in debug insns. We run this after expanding all
5360 regular insns, so that any variables referenced in the function
5361 will have their DECL_RTLs set. */
5363 static void
5364 expand_debug_locations (void)
5366 rtx_insn *insn;
5367 rtx_insn *last = get_last_insn ();
5368 int save_strict_alias = flag_strict_aliasing;
5370 /* New alias sets while setting up memory attributes cause
5371 -fcompare-debug failures, even though it doesn't bring about any
5372 codegen changes. */
5373 flag_strict_aliasing = 0;
5375 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5376 if (DEBUG_BIND_INSN_P (insn))
5378 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5379 rtx val;
5380 rtx_insn *prev_insn, *insn2;
5381 machine_mode mode;
5383 if (value == NULL_TREE)
5384 val = NULL_RTX;
5385 else
5387 if (INSN_VAR_LOCATION_STATUS (insn)
5388 == VAR_INIT_STATUS_UNINITIALIZED)
5389 val = expand_debug_source_expr (value);
5390 /* The avoid_deep_ter_for_debug function inserts
5391 debug bind stmts after SSA_NAME definition, with the
5392 SSA_NAME as the whole bind location. Disable temporarily
5393 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5394 being defined in this DEBUG_INSN. */
5395 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5397 tree *slot = deep_ter_debug_map->get (value);
5398 if (slot)
5400 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5401 *slot = NULL_TREE;
5402 else
5403 slot = NULL;
5405 val = expand_debug_expr (value);
5406 if (slot)
5407 *slot = INSN_VAR_LOCATION_DECL (insn);
5409 else
5410 val = expand_debug_expr (value);
5411 gcc_assert (last == get_last_insn ());
5414 if (!val)
5415 val = gen_rtx_UNKNOWN_VAR_LOC ();
5416 else
5418 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5420 gcc_assert (mode == GET_MODE (val)
5421 || (GET_MODE (val) == VOIDmode
5422 && (CONST_SCALAR_INT_P (val)
5423 || GET_CODE (val) == CONST_FIXED
5424 || GET_CODE (val) == LABEL_REF)));
5427 INSN_VAR_LOCATION_LOC (insn) = val;
5428 prev_insn = PREV_INSN (insn);
5429 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5430 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5433 flag_strict_aliasing = save_strict_alias;
5436 /* Performs swapping operands of commutative operations to expand
5437 the expensive one first. */
5439 static void
5440 reorder_operands (basic_block bb)
5442 unsigned int *lattice; /* Hold cost of each statement. */
5443 unsigned int i = 0, n = 0;
5444 gimple_stmt_iterator gsi;
5445 gimple_seq stmts;
5446 gimple *stmt;
5447 bool swap;
5448 tree op0, op1;
5449 ssa_op_iter iter;
5450 use_operand_p use_p;
5451 gimple *def0, *def1;
5453 /* Compute cost of each statement using estimate_num_insns. */
5454 stmts = bb_seq (bb);
5455 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5457 stmt = gsi_stmt (gsi);
5458 if (!is_gimple_debug (stmt))
5459 gimple_set_uid (stmt, n++);
5461 lattice = XNEWVEC (unsigned int, n);
5462 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5464 unsigned cost;
5465 stmt = gsi_stmt (gsi);
5466 if (is_gimple_debug (stmt))
5467 continue;
5468 cost = estimate_num_insns (stmt, &eni_size_weights);
5469 lattice[i] = cost;
5470 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5472 tree use = USE_FROM_PTR (use_p);
5473 gimple *def_stmt;
5474 if (TREE_CODE (use) != SSA_NAME)
5475 continue;
5476 def_stmt = get_gimple_for_ssa_name (use);
5477 if (!def_stmt)
5478 continue;
5479 lattice[i] += lattice[gimple_uid (def_stmt)];
5481 i++;
5482 if (!is_gimple_assign (stmt)
5483 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5484 continue;
5485 op0 = gimple_op (stmt, 1);
5486 op1 = gimple_op (stmt, 2);
5487 if (TREE_CODE (op0) != SSA_NAME
5488 || TREE_CODE (op1) != SSA_NAME)
5489 continue;
5490 /* Swap operands if the second one is more expensive. */
5491 def0 = get_gimple_for_ssa_name (op0);
5492 def1 = get_gimple_for_ssa_name (op1);
5493 if (!def1)
5494 continue;
5495 swap = false;
5496 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5497 swap = true;
5498 if (swap)
5500 if (dump_file && (dump_flags & TDF_DETAILS))
5502 fprintf (dump_file, "Swap operands in stmt:\n");
5503 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5504 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5505 def0 ? lattice[gimple_uid (def0)] : 0,
5506 lattice[gimple_uid (def1)]);
5508 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5509 gimple_assign_rhs2_ptr (stmt));
5512 XDELETE (lattice);
5515 /* Expand basic block BB from GIMPLE trees to RTL.
   If DISABLE_TAIL_CALLS is true, the tail-call flag is cleared on every
   call statement that carries it before the call is expanded.
   Returns the block in which expansion finished: BB itself, or the block
   handed back by expand_gimple_cond or expand_gimple_tailcall when one of
   them ends (or, for a tail call that can fall through, continues)
   expansion in a new block. */
5517 static basic_block
5518 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5520 gimple_stmt_iterator gsi;
5521 gimple_seq stmts;
5522 gimple *stmt = NULL;
5523 rtx_note *note = NULL;
5524 rtx_insn *last;
5525 edge e;
5526 edge_iterator ei;
5528 if (dump_file)
5529 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5530 bb->index);
5532 /* Note that since we are now transitioning from GIMPLE to RTL, we
5533 cannot use the gsi_*_bb() routines because they expect the basic
5534 block to be in GIMPLE, instead of RTL. Therefore, we need to
5535 access the BB sequence directly. */
5536 if (optimize)
5537 reorder_operands (bb);
/* Take the statement sequence and PHI nodes out of BB and flag the
   block as holding RTL from here on. */
5538 stmts = bb_seq (bb);
5539 bb->il.gimple.seq = NULL;
5540 bb->il.gimple.phi_nodes = NULL;
5541 rtl_profile_for_bb (bb);
5542 init_rtl_bb_info (bb);
5543 bb->flags |= BB_RTL;
5545 /* Remove the RETURN_EXPR if we may fall through to the exit
5546 instead. */
5547 gsi = gsi_last (stmts);
5548 if (!gsi_end_p (gsi)
5549 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5551 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5553 gcc_assert (single_succ_p (bb));
5554 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5556 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5557 && !gimple_return_retval (ret_stmt))
5559 gsi_remove (&gsi, false);
5560 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
/* STMT is kept only when the first statement is a GIMPLE_LABEL; ELT is
   the label recorded for BB in lab_rtx_for_bb, if there is one. */
5564 gsi = gsi_start (stmts);
5565 if (!gsi_end_p (gsi))
5567 stmt = gsi_stmt (gsi);
5568 if (gimple_code (stmt) != GIMPLE_LABEL)
5569 stmt = NULL;
5572 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5574 if (stmt || elt)
5576 gcc_checking_assert (!note);
5577 last = get_last_insn ();
5579 if (stmt)
5581 expand_gimple_stmt (stmt);
5582 gsi_next (&gsi);
5585 if (elt)
5586 emit_label (*elt);
/* The block starts at the first insn emitted after LAST; one leading
   note is skipped so that BB_HEAD is the label, and the basic-block
   note is placed right after that label. */
5588 BB_HEAD (bb) = NEXT_INSN (last);
5589 if (NOTE_P (BB_HEAD (bb)))
5590 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5591 gcc_assert (LABEL_P (BB_HEAD (bb)));
5592 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5594 maybe_dump_rtl_for_gimple_stmt (stmt, last);
/* No label of either kind: the basic-block note itself heads the block. */
5596 else
5597 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5599 if (note)
5600 NOTE_BASIC_BLOCK (note) = bb;
5602 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5604 basic_block new_bb;
5606 stmt = gsi_stmt (gsi);
5608 /* If this statement is a non-debug one, and we generate debug
5609 insns, then this one might be the last real use of a TERed
5610 SSA_NAME, but where there are still some debug uses further
5611 down. Expanding the current SSA name in such further debug
5612 uses by their RHS might lead to wrong debug info, as coalescing
5613 might make the operands of such RHS be placed into the same
5614 pseudo as something else. Like so:
5615 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5616 use(a_1);
5617 a_2 = ...
5618 #DEBUG ... => a_1
5619 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5620 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
5621 the write to a_2 would actually have clobbered the place which
5622 formerly held a_0.
5624 So, instead of that, we recognize the situation, and generate
5625 debug temporaries at the last real use of TERed SSA names:
5626 a_1 = a_0 + 1;
5627 #DEBUG #D1 => a_1
5628 use(a_1);
5629 a_2 = ...
5630 #DEBUG ... => #D1
5632 if (MAY_HAVE_DEBUG_BIND_INSNS
5633 && SA.values
5634 && !is_gimple_debug (stmt))
5636 ssa_op_iter iter;
5637 tree op;
5638 gimple *def;
5640 location_t sloc = curr_insn_location ();
5642 /* Look for SSA names that have their last use here (TERed
5643 names always have only one real use). */
5644 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5645 if ((def = get_gimple_for_ssa_name (op)))
5647 imm_use_iterator imm_iter;
5648 use_operand_p use_p;
5649 bool have_debug_uses = false;
5651 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5653 if (gimple_debug_bind_p (USE_STMT (use_p)))
5655 have_debug_uses = true;
5656 break;
5660 if (have_debug_uses)
5662 /* OP is a TERed SSA name, with DEF its defining
5663 statement, and where OP is used in further debug
5664 instructions. Generate a debug temporary, and
5665 replace all uses of OP in debug insns with that
5666 temporary. */
5667 gimple *debugstmt;
5668 tree value = gimple_assign_rhs_to_tree (def);
5669 tree vexpr = make_node (DEBUG_EXPR_DECL);
5670 rtx val;
5671 machine_mode mode;
5673 set_curr_insn_location (gimple_location (def));
5675 DECL_ARTIFICIAL (vexpr) = 1;
5676 TREE_TYPE (vexpr) = TREE_TYPE (value);
5677 if (DECL_P (value))
5678 mode = DECL_MODE (value);
5679 else
5680 mode = TYPE_MODE (TREE_TYPE (value));
5681 SET_DECL_MODE (vexpr, mode);
/* The tree VALUE is stored, cast to rtx, in the location slot of the
   VAR_LOCATION that binds VEXPR. */
5683 val = gen_rtx_VAR_LOCATION
5684 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5686 emit_debug_insn (val);
5688 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5690 if (!gimple_debug_bind_p (debugstmt))
5691 continue;
5693 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5694 SET_USE (use_p, vexpr);
5696 update_stmt (debugstmt);
5700 set_curr_insn_location (sloc);
5703 currently_expanding_gimple_stmt = stmt;
5705 /* Expand this statement, then evaluate the resulting RTL and
5706 fixup the CFG accordingly. */
5707 if (gimple_code (stmt) == GIMPLE_COND)
5709 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5710 if (new_bb)
5711 return new_bb;
5713 else if (is_gimple_debug (stmt))
5715 location_t sloc = curr_insn_location ();
5716 gimple_stmt_iterator nsi = gsi;
/* Handle the whole run of consecutive debug stmts that starts at STMT
   in this inner loop; NSI looks one statement ahead of GSI. */
5718 for (;;)
5720 tree var;
5721 tree value = NULL_TREE;
5722 rtx val = NULL_RTX;
5723 machine_mode mode;
5725 if (!gimple_debug_nonbind_marker_p (stmt))
5727 if (gimple_debug_bind_p (stmt))
5729 var = gimple_debug_bind_get_var (stmt);
5731 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5732 && TREE_CODE (var) != LABEL_DECL
5733 && !target_for_debug_bind (var))
5734 goto delink_debug_stmt;
5736 if (DECL_P (var))
5737 mode = DECL_MODE (var);
5738 else
5739 mode = TYPE_MODE (TREE_TYPE (var));
5741 if (gimple_debug_bind_has_value_p (stmt))
5742 value = gimple_debug_bind_get_value (stmt);
5744 val = gen_rtx_VAR_LOCATION
5745 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5747 else if (gimple_debug_source_bind_p (stmt))
5749 var = gimple_debug_source_bind_get_var (stmt);
5751 value = gimple_debug_source_bind_get_value (stmt);
5753 mode = DECL_MODE (var);
5755 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5756 VAR_INIT_STATUS_UNINITIALIZED);
5758 else
5759 gcc_unreachable ();
5761 /* If this function was first compiled with markers
5762 enabled, but they're now disabled (e.g. LTO), drop
5763 them on the floor. */
5764 else if (gimple_debug_nonbind_marker_p (stmt)
5765 && !MAY_HAVE_DEBUG_MARKER_INSNS)
5766 goto delink_debug_stmt;
5767 else if (gimple_debug_begin_stmt_p (stmt))
5768 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
5769 else if (gimple_debug_inline_entry_p (stmt))
5771 tree block = gimple_block (stmt);
5773 if (block)
5774 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
5775 else
5776 goto delink_debug_stmt;
5778 else
5779 gcc_unreachable ();
5781 last = get_last_insn ();
5783 set_curr_insn_location (gimple_location (stmt));
5785 emit_debug_insn (val);
5787 if (dump_file && (dump_flags & TDF_DETAILS))
5789 /* We can't dump the insn with a TREE where an RTX
5790 is expected. */
5791 if (GET_CODE (val) == VAR_LOCATION)
5793 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
5794 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5796 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5797 if (GET_CODE (val) == VAR_LOCATION)
5798 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5801 delink_debug_stmt:
5802 /* In order not to generate too many debug temporaries,
5803 we delink all uses of debug statements we already expanded.
5804 Therefore debug statements between definition and real
5805 use of TERed SSA names will continue to use the SSA name,
5806 and not be replaced with debug temps. */
5807 delink_stmt_imm_use (stmt);
/* Step forward: GSI now names the stmt just handled and NSI the one
   after it.  Leave the inner loop at the end of the sequence or at the
   first non-debug stmt, so that GSI rests on the last debug stmt
   handled and the outer loop's gsi_next steps past it. */
5809 gsi = nsi;
5810 gsi_next (&nsi);
5811 if (gsi_end_p (nsi))
5812 break;
5813 stmt = gsi_stmt (nsi);
5814 if (!is_gimple_debug (stmt))
5815 break;
5818 set_curr_insn_location (sloc);
5820 else
/* Neither a GIMPLE_COND nor a debug stmt.  A call keeps its tail-call
   flag only when DISABLE_TAIL_CALLS is false. */
5822 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5823 if (call_stmt
5824 && gimple_call_tail_p (call_stmt)
5825 && disable_tail_calls)
5826 gimple_call_set_tail (call_stmt, false);
5828 if (call_stmt && gimple_call_tail_p (call_stmt))
5830 bool can_fallthru;
5831 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5832 if (new_bb)
5834 if (can_fallthru)
5835 bb = new_bb;
5836 else
5837 return new_bb;
5840 else
5842 def_operand_p def_p;
5843 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5845 if (def_p != NULL)
5847 /* Ignore this stmt if it is in the list of
5848 replaceable expressions. */
5849 if (SA.values
5850 && bitmap_bit_p (SA.values,
5851 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5852 continue;
5854 last = expand_gimple_stmt (stmt);
5855 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5860 currently_expanding_gimple_stmt = NULL;
5862 /* Expand implicit goto and convert goto_locus. */
5863 FOR_EACH_EDGE (e, ei, bb->succs)
5865 if (e->goto_locus != UNKNOWN_LOCATION)
5866 set_curr_insn_location (e->goto_locus);
5867 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5869 emit_jump (label_rtx_for_bb (e->dest));
5870 e->flags &= ~EDGE_FALLTHRU;
5874 /* Expanded RTL can create a jump in the last instruction of block.
5875 This later might be assumed to be a jump to successor and break edge insertion.
5876 We need to insert dummy move to prevent this. PR41440. */
5877 if (single_succ_p (bb)
5878 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5879 && (last = get_last_insn ())
5880 && (JUMP_P (last)
5881 || (DEBUG_INSN_P (last)
5882 && JUMP_P (prev_nondebug_insn (last)))))
5884 rtx dummy = gen_reg_rtx (SImode);
5885 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5888 do_pending_stack_adjust ();
5890 /* Find the block tail. The last insn in the block is the insn
5891 before a barrier and/or table jump insn. */
5892 last = get_last_insn ();
5893 if (BARRIER_P (last))
5894 last = PREV_INSN (last);
5895 if (JUMP_TABLE_DATA_P (last))
5896 last = PREV_INSN (PREV_INSN (last));
5897 if (BARRIER_P (last))
5898 last = PREV_INSN (last);
5899 BB_END (bb) = last;
5901 update_bb_for_insn (bb);
5903 return bb;
5907 /* Create a basic block for initialization code. */
5909 static basic_block
5910 construct_init_block (void)
5912 basic_block init_block, first_block;
5913 edge e = NULL;
5914 int flags;
5916 /* Multiple entry points not supported yet. */
5917 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5918 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5919 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5920 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5921 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5923 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5925 /* When entry edge points to first basic block, we don't need jump,
5926 otherwise we have to jump into proper target. */
5927 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5929 tree label = gimple_block_label (e->dest);
5931 emit_jump (jump_target_rtx (label));
5932 flags = 0;
5934 else
5935 flags = EDGE_FALLTHRU;
5937 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5938 get_last_insn (),
5939 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5940 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5941 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5942 if (e)
5944 first_block = e->dest;
5945 redirect_edge_succ (e, init_block);
5946 e = make_single_succ_edge (init_block, first_block, flags);
5948 else
5949 e = make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5950 EDGE_FALLTHRU);
5952 update_bb_for_insn (init_block);
5953 return init_block;
5956 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5957 found in the block tree. */
5959 static void
5960 set_block_levels (tree block, int level)
5962 while (block)
5964 BLOCK_NUMBER (block) = level;
5965 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5966 block = BLOCK_CHAIN (block);
5970 /* Create a block containing landing pads and similar stuff. */
5972 static void
5973 construct_exit_block (void)
5975 rtx_insn *head = get_last_insn ();
5976 rtx_insn *end;
5977 basic_block exit_block;
5978 edge e, e2;
5979 unsigned ix;
5980 edge_iterator ei;
5981 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5982 rtx_insn *orig_end = BB_END (prev_bb);
5984 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5986 /* Make sure the locus is set to the end of the function, so that
5987 epilogue line numbers and warnings are set properly. */
5988 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5989 input_location = cfun->function_end_locus;
5991 /* Generate rtl for function exit. */
5992 expand_function_end ();
5994 end = get_last_insn ();
5995 if (head == end)
5996 return;
5997 /* While emitting the function end we could move end of the last basic
5998 block. */
5999 BB_END (prev_bb) = orig_end;
6000 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6001 head = NEXT_INSN (head);
6002 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6003 bb count counting will be confused. Any instructions before that
6004 label are emitted for the case where PREV_BB falls through into the
6005 exit block, so append those instructions to prev_bb in that case. */
6006 if (NEXT_INSN (head) != return_label)
6008 while (NEXT_INSN (head) != return_label)
6010 if (!NOTE_P (NEXT_INSN (head)))
6011 BB_END (prev_bb) = NEXT_INSN (head);
6012 head = NEXT_INSN (head);
6015 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6016 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6017 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6019 ix = 0;
6020 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6022 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6023 if (!(e->flags & EDGE_ABNORMAL))
6024 redirect_edge_succ (e, exit_block);
6025 else
6026 ix++;
6029 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6030 EDGE_FALLTHRU);
6031 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6032 if (e2 != e)
6034 exit_block->count -= e2->count ();
6036 update_bb_for_insn (exit_block);
6039 /* Helper function for discover_nonconstant_array_refs.
6040 Look for ARRAY_REF nodes with non-constant indexes and mark them
6041 addressable. */
6043 static tree
6044 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6045 void *data ATTRIBUTE_UNUSED)
6047 tree t = *tp;
6049 if (IS_TYPE_OR_DECL_P (t))
6050 *walk_subtrees = 0;
6051 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6053 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6054 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6055 && (!TREE_OPERAND (t, 2)
6056 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6057 || (TREE_CODE (t) == COMPONENT_REF
6058 && (!TREE_OPERAND (t,2)
6059 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6060 || TREE_CODE (t) == BIT_FIELD_REF
6061 || TREE_CODE (t) == REALPART_EXPR
6062 || TREE_CODE (t) == IMAGPART_EXPR
6063 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6064 || CONVERT_EXPR_P (t))
6065 t = TREE_OPERAND (t, 0);
6067 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6069 t = get_base_address (t);
6070 if (t && DECL_P (t)
6071 && DECL_MODE (t) != BLKmode)
6072 TREE_ADDRESSABLE (t) = 1;
6075 *walk_subtrees = 0;
6078 return NULL_TREE;
6081 /* RTL expansion is not able to compile array references with variable
6082 offsets for arrays stored in single register. Discover such
6083 expressions and mark variables as addressable to avoid this
6084 scenario. */
6086 static void
6087 discover_nonconstant_array_refs (void)
6089 basic_block bb;
6090 gimple_stmt_iterator gsi;
6092 FOR_EACH_BB_FN (bb, cfun)
6093 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6095 gimple *stmt = gsi_stmt (gsi);
6096 if (!is_gimple_debug (stmt))
6097 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
6101 /* This function sets crtl->args.internal_arg_pointer to a virtual
6102 register if DRAP is needed. Local register allocator will replace
6103 virtual_incoming_args_rtx with the virtual register. */
6105 static void
6106 expand_stack_alignment (void)
6108 rtx drap_rtx;
6109 unsigned int preferred_stack_boundary;
6111 if (! SUPPORTS_STACK_ALIGNMENT)
6112 return;
6114 if (cfun->calls_alloca
6115 || cfun->has_nonlocal_label
6116 || crtl->has_nonlocal_goto)
6117 crtl->need_drap = true;
6119 /* Call update_stack_boundary here again to update incoming stack
6120 boundary. It may set incoming stack alignment to a different
6121 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6122 use the minimum incoming stack alignment to check if it is OK
6123 to perform sibcall optimization since sibcall optimization will
6124 only align the outgoing stack to incoming stack boundary. */
6125 if (targetm.calls.update_stack_boundary)
6126 targetm.calls.update_stack_boundary ();
6128 /* The incoming stack frame has to be aligned at least at
6129 parm_stack_boundary. */
6130 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6132 /* Update crtl->stack_alignment_estimated and use it later to align
6133 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6134 exceptions since callgraph doesn't collect incoming stack alignment
6135 in this case. */
6136 if (cfun->can_throw_non_call_exceptions
6137 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6138 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6139 else
6140 preferred_stack_boundary = crtl->preferred_stack_boundary;
6141 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6142 crtl->stack_alignment_estimated = preferred_stack_boundary;
6143 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6144 crtl->stack_alignment_needed = preferred_stack_boundary;
6146 gcc_assert (crtl->stack_alignment_needed
6147 <= crtl->stack_alignment_estimated);
6149 crtl->stack_realign_needed
6150 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6151 crtl->stack_realign_tried = crtl->stack_realign_needed;
6153 crtl->stack_realign_processed = true;
6155 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6156 alignment. */
6157 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6158 drap_rtx = targetm.calls.get_drap_rtx ();
6160 /* stack_realign_drap and drap_rtx must match. */
6161 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6163 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6164 if (drap_rtx != NULL)
6166 crtl->args.internal_arg_pointer = drap_rtx;
6168 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6169 needed. */
6170 fixup_tail_calls ();
6175 static void
6176 expand_main_function (void)
6178 #if (defined(INVOKE__main) \
6179 || (!defined(HAS_INIT_SECTION) \
6180 && !defined(INIT_SECTION_ASM_OP) \
6181 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6182 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6183 #endif
6187 /* Expand code to initialize the stack_protect_guard. This is invoked at
6188 the beginning of a function to be protected. */
6190 static void
6191 stack_protect_prologue (void)
6193 tree guard_decl = targetm.stack_protect_guard ();
6194 rtx x, y;
6196 x = expand_normal (crtl->stack_protect_guard);
6198 if (targetm.have_stack_protect_combined_set () && guard_decl)
6200 gcc_assert (DECL_P (guard_decl));
6201 y = DECL_RTL (guard_decl);
6203 /* Allow the target to compute address of Y and copy it to X without
6204 leaking Y into a register. This combined address + copy pattern
6205 allows the target to prevent spilling of any intermediate results by
6206 splitting it after register allocator. */
6207 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6209 emit_insn (insn);
6210 return;
6214 if (guard_decl)
6215 y = expand_normal (guard_decl);
6216 else
6217 y = const0_rtx;
6219 /* Allow the target to copy from Y to X without leaking Y into a
6220 register. */
6221 if (targetm.have_stack_protect_set ())
6222 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6224 emit_insn (insn);
6225 return;
6228 /* Otherwise do a straight move. */
6229 emit_move_insn (x, y);
6232 /* Translate the intermediate representation contained in the CFG
6233 from GIMPLE trees to RTL.
6235 We do conversion per basic block and preserve/update the tree CFG.
6236 This implies we have to do some magic as the CFG can simultaneously
6237 consist of basic blocks containing RTL and GIMPLE trees. This can
6238 confuse the CFG hooks, so be careful to not manipulate CFG during
6239 the expansion. */
6241 namespace {
6243 const pass_data pass_data_expand =
6245 RTL_PASS, /* type */
6246 "expand", /* name */
6247 OPTGROUP_NONE, /* optinfo_flags */
6248 TV_EXPAND, /* tv_id */
6249 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6250 | PROP_gimple_lcx
6251 | PROP_gimple_lvec
6252 | PROP_gimple_lva), /* properties_required */
6253 PROP_rtl, /* properties_provided */
6254 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6255 0, /* todo_flags_start */
6256 0, /* todo_flags_finish */
6259 class pass_expand : public rtl_opt_pass
6261 public:
6262 pass_expand (gcc::context *ctxt)
6263 : rtl_opt_pass (pass_data_expand, ctxt)
6266 /* opt_pass methods: */
6267 virtual unsigned int execute (function *);
6269 }; // class pass_expand
6271 unsigned int
6272 pass_expand::execute (function *fun)
6274 basic_block bb, init_block;
6275 edge_iterator ei;
6276 edge e;
6277 rtx_insn *var_seq, *var_ret_seq;
6278 unsigned i;
6280 timevar_push (TV_OUT_OF_SSA);
6281 rewrite_out_of_ssa (&SA);
6282 timevar_pop (TV_OUT_OF_SSA);
6283 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6285 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6287 gimple_stmt_iterator gsi;
6288 FOR_EACH_BB_FN (bb, cfun)
6289 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6290 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6291 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6294 /* Make sure all values used by the optimization passes have sane
6295 defaults. */
6296 reg_renumber = 0;
6298 /* Some backends want to know that we are expanding to RTL. */
6299 currently_expanding_to_rtl = 1;
6300 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6301 free_dominance_info (CDI_DOMINATORS);
6303 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6305 insn_locations_init ();
6306 if (!DECL_IS_BUILTIN (current_function_decl))
6308 /* Eventually, all FEs should explicitly set function_start_locus. */
6309 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6310 set_curr_insn_location
6311 (DECL_SOURCE_LOCATION (current_function_decl));
6312 else
6313 set_curr_insn_location (fun->function_start_locus);
6315 else
6316 set_curr_insn_location (UNKNOWN_LOCATION);
6317 prologue_location = curr_insn_location ();
6319 #ifdef INSN_SCHEDULING
6320 init_sched_attrs ();
6321 #endif
6323 /* Make sure first insn is a note even if we don't want linenums.
6324 This makes sure the first insn will never be deleted.
6325 Also, final expects a note to appear there. */
6326 emit_note (NOTE_INSN_DELETED);
6328 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6329 discover_nonconstant_array_refs ();
6331 targetm.expand_to_rtl_hook ();
6332 crtl->init_stack_alignment ();
6333 fun->cfg->max_jumptable_ents = 0;
6335 /* Resolve the function section. Some targets, like ARM EABI, rely on knowledge
6336 of the function section at expansion time to predict distance of calls. */
6337 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6339 /* Expand the variables recorded during gimple lowering. */
6340 timevar_push (TV_VAR_EXPAND);
6341 start_sequence ();
6343 var_ret_seq = expand_used_vars ();
6345 var_seq = get_insns ();
6346 end_sequence ();
6347 timevar_pop (TV_VAR_EXPAND);
6349 /* Honor stack protection warnings. */
6350 if (warn_stack_protect)
6352 if (fun->calls_alloca)
6353 warning (OPT_Wstack_protector,
6354 "stack protector not protecting local variables: "
6355 "variable length buffer");
6356 if (has_short_buffer && !crtl->stack_protect_guard)
6357 warning (OPT_Wstack_protector,
6358 "stack protector not protecting function: "
6359 "all local arrays are less than %d bytes long",
6360 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6363 /* Set up parameters and prepare for return, for the function. */
6364 expand_function_start (current_function_decl);
6366 /* If we emitted any instructions for setting up the variables,
6367 emit them before the FUNCTION_START note. */
6368 if (var_seq)
6370 emit_insn_before (var_seq, parm_birth_insn);
6372 /* In expand_function_end we'll insert the alloca save/restore
6373 before parm_birth_insn. We've just inserted an alloca call.
6374 Adjust the pointer to match. */
6375 parm_birth_insn = var_seq;
6378 /* Now propagate the RTL assignment of each partition to the
6379 underlying var of each SSA_NAME. */
6380 tree name;
6382 FOR_EACH_SSA_NAME (i, name, cfun)
6384 /* We might have generated new SSA names in
6385 update_alias_info_with_stack_vars. They will have a NULL
6386 defining statements, and won't be part of the partitioning,
6387 so ignore those. */
6388 if (!SSA_NAME_DEF_STMT (name))
6389 continue;
6391 adjust_one_expanded_partition_var (name);
6394 /* Clean up RTL of variables that straddle across multiple
6395 partitions, and check that the rtl of any PARM_DECLs that are not
6396 cleaned up is that of their default defs. */
6397 FOR_EACH_SSA_NAME (i, name, cfun)
6399 int part;
6401 /* We might have generated new SSA names in
6402 update_alias_info_with_stack_vars. They will have a NULL
6403 defining statements, and won't be part of the partitioning,
6404 so ignore those. */
6405 if (!SSA_NAME_DEF_STMT (name))
6406 continue;
6407 part = var_to_partition (SA.map, name);
6408 if (part == NO_PARTITION)
6409 continue;
6411 /* If this decl was marked as living in multiple places, reset
6412 this now to NULL. */
6413 tree var = SSA_NAME_VAR (name);
6414 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6415 SET_DECL_RTL (var, NULL);
6416 /* Check that the pseudos chosen by assign_parms are those of
6417 the corresponding default defs. */
6418 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6419 && (TREE_CODE (var) == PARM_DECL
6420 || TREE_CODE (var) == RESULT_DECL))
6422 rtx in = DECL_RTL_IF_SET (var);
6423 gcc_assert (in);
6424 rtx out = SA.partition_to_pseudo[part];
6425 gcc_assert (in == out);
6427 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6428 those expected by debug backends for each parm and for
6429 the result. This is particularly important for stabs,
6430 whose register elimination from parm's DECL_RTL may cause
6431 -fcompare-debug differences as SET_DECL_RTL changes reg's
6432 attrs. So, make sure the RTL already has the parm as the
6433 EXPR, so that it won't change. */
6434 SET_DECL_RTL (var, NULL_RTX);
6435 if (MEM_P (in))
6436 set_mem_attributes (in, var, true);
6437 SET_DECL_RTL (var, in);
6441 /* If this function is `main', emit a call to `__main'
6442 to run global initializers, etc. */
6443 if (DECL_NAME (current_function_decl)
6444 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6445 && DECL_FILE_SCOPE_P (current_function_decl))
6446 expand_main_function ();
6448 /* Initialize the stack_protect_guard field. This must happen after the
6449 call to __main (if any) so that the external decl is initialized. */
6450 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6451 stack_protect_prologue ();
6453 expand_phi_nodes (&SA);
6455 /* Release any stale SSA redirection data. */
6456 redirect_edge_var_map_empty ();
6458 /* Register rtl specific functions for cfg. */
6459 rtl_register_cfg_hooks ();
6461 init_block = construct_init_block ();
6463 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6464 remaining edges later. */
6465 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6466 e->flags &= ~EDGE_EXECUTABLE;
6468 /* If the function has too many markers, drop them while expanding. */
6469 if (cfun->debug_marker_count
6470 >= PARAM_VALUE (PARAM_MAX_DEBUG_MARKER_COUNT))
6471 cfun->debug_nonbind_markers = false;
6473 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6474 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6475 next_bb)
6476 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6478 if (MAY_HAVE_DEBUG_BIND_INSNS)
6479 expand_debug_locations ();
6481 if (deep_ter_debug_map)
6483 delete deep_ter_debug_map;
6484 deep_ter_debug_map = NULL;
6487 /* Free stuff we no longer need after GIMPLE optimizations. */
6488 free_dominance_info (CDI_DOMINATORS);
6489 free_dominance_info (CDI_POST_DOMINATORS);
6490 delete_tree_cfg_annotations (fun);
6492 timevar_push (TV_OUT_OF_SSA);
6493 finish_out_of_ssa (&SA);
6494 timevar_pop (TV_OUT_OF_SSA);
6496 timevar_push (TV_POST_EXPAND);
6497 /* We are no longer in SSA form. */
6498 fun->gimple_df->in_ssa_p = false;
6499 loops_state_clear (LOOP_CLOSED_SSA);
6501 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6502 conservatively to true until they are all profile aware. */
6503 delete lab_rtx_for_bb;
6504 free_histograms (fun);
6506 construct_exit_block ();
6507 insn_locations_finalize ();
6509 if (var_ret_seq)
6511 rtx_insn *after = return_label;
6512 rtx_insn *next = NEXT_INSN (after);
6513 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6514 after = next;
6515 emit_insn_after (var_ret_seq, after);
6518 /* Zap the tree EH table. */
6519 set_eh_throw_stmt_table (fun, NULL);
6521 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6522 split edges which edge insertions might do. */
6523 rebuild_jump_labels (get_insns ());
6525 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6526 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6528 edge e;
6529 edge_iterator ei;
6530 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6532 if (e->insns.r)
6534 rebuild_jump_labels_chain (e->insns.r);
6535 /* Put insns after parm birth, but before
6536 NOTE_INSN_FUNCTION_BEG. */
6537 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6538 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6540 rtx_insn *insns = e->insns.r;
6541 e->insns.r = NULL;
6542 if (NOTE_P (parm_birth_insn)
6543 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6544 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6545 else
6546 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6548 else
6549 commit_one_edge_insertion (e);
6551 else
6552 ei_next (&ei);
6556 /* We're done expanding trees to RTL. */
6557 currently_expanding_to_rtl = 0;
6559 flush_mark_addressable_queue ();
6561 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6562 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6564 edge e;
6565 edge_iterator ei;
6566 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6568 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6569 e->flags &= ~EDGE_EXECUTABLE;
6571 /* At the moment not all abnormal edges match the RTL
6572 representation. It is safe to remove them here as
6573 find_many_sub_basic_blocks will rediscover them.
6574 In the future we should get this fixed properly. */
6575 if ((e->flags & EDGE_ABNORMAL)
6576 && !(e->flags & EDGE_SIBCALL))
6577 remove_edge (e);
6578 else
6579 ei_next (&ei);
6583 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6584 bitmap_ones (blocks);
6585 find_many_sub_basic_blocks (blocks);
6586 purge_all_dead_edges ();
6588 /* After initial rtl generation, call back to finish generating
6589 exception support code. We need to do this before cleaning up
6590 the CFG as the code does not expect dead landing pads. */
6591 if (fun->eh->region_tree != NULL)
6592 finish_eh_generation ();
6594 /* Call expand_stack_alignment after finishing all
6595 updates to crtl->preferred_stack_boundary. */
6596 expand_stack_alignment ();
6598 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6599 function. */
6600 if (crtl->tail_call_emit)
6601 fixup_tail_calls ();
6603 /* BB subdivision may have created basic blocks that are only reachable
6604 from unlikely bbs but not marked as such in the profile. */
6605 if (optimize)
6606 propagate_unlikely_bbs_forward ();
6608 /* Remove unreachable blocks, otherwise we cannot compute dominators
6609 which are needed for loop state verification. As a side-effect
6610 this also compacts blocks.
6611 ??? We cannot remove trivially dead insns here as for example
6612 the DRAP reg on i?86 is not magically live at this point.
6613 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6614 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6616 checking_verify_flow_info ();
6618 /* Initialize pseudos allocated for hard registers. */
6619 emit_initial_value_sets ();
6621 /* And finally unshare all RTL. */
6622 unshare_all_rtl ();
6624 /* There's no need to defer outputting this function any more; we
6625 know we want to output it. */
6626 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6628 /* Now that we're done expanding trees to RTL, we shouldn't have any
6629 more CONCATs anywhere. */
6630 generating_concat_p = 0;
6632 if (dump_file)
6634 fprintf (dump_file,
6635 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6636 /* And the pass manager will dump RTL for us. */
6639 /* If we're emitting a nested function, make sure its parent gets
6640 emitted as well. Doing otherwise confuses debug info. */
6642 tree parent;
6643 for (parent = DECL_CONTEXT (current_function_decl);
6644 parent != NULL_TREE;
6645 parent = get_containing_scope (parent))
6646 if (TREE_CODE (parent) == FUNCTION_DECL)
6647 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6650 TREE_ASM_WRITTEN (current_function_decl) = 1;
6652 /* After expanding, the return labels are no longer needed. */
6653 return_label = NULL;
6654 naked_return_label = NULL;
6656 /* After expanding, the tm_restart map is no longer needed. */
6657 if (fun->gimple_df->tm_restart)
6658 fun->gimple_df->tm_restart = NULL;
6660 /* Tag the blocks with a depth number so that change_scope can find
6661 the common parent easily. */
6662 set_block_levels (DECL_INITIAL (fun->decl), 0);
6663 default_rtl_profile ();
6665 /* For -dx discard loops now, otherwise IL verify in clean_state will
6666 ICE. */
6667 if (rtl_dump_and_exit)
6669 cfun->curr_properties &= ~PROP_loops;
6670 loop_optimizer_finalize ();
6673 timevar_pop (TV_POST_EXPAND);
6675 return 0;
6678 } // anon namespace
/* Factory for the expand pass: allocate a new pass_expand constructed
   with CTXT and return it as an rtl_opt_pass pointer.  */
6680 rtl_opt_pass *
6681 make_pass_expand (gcc::context *ctxt)
6683 return new pass_expand (ctxt);