Relocation (= move+destroy)
[official-gcc.git] / gcc / cfgexpand.c
blob9d1eab6dfe2ef7c254a550fb781ca300f7a79f38
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "params.h"
65 #include "tree-inline.h"
66 #include "value-prof.h"
67 #include "tree-ssa-live.h"
68 #include "tree-outof-ssa.h"
69 #include "cfgloop.h"
70 #include "insn-attr.h" /* For INSN_SCHEDULING. */
71 #include "stringpool.h"
72 #include "attribs.h"
73 #include "asan.h"
74 #include "tree-ssa-address.h"
75 #include "output.h"
76 #include "builtins.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
/* Forward declarations of static helpers that are used before the point
   in this file where they are defined. */
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 enum gimple_rhs_class grhs_class;
109 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
111 if (grhs_class == GIMPLE_TERNARY_RHS)
112 t = build3 (gimple_assign_rhs_code (stmt),
113 TREE_TYPE (gimple_assign_lhs (stmt)),
114 gimple_assign_rhs1 (stmt),
115 gimple_assign_rhs2 (stmt),
116 gimple_assign_rhs3 (stmt));
117 else if (grhs_class == GIMPLE_BINARY_RHS)
118 t = build2 (gimple_assign_rhs_code (stmt),
119 TREE_TYPE (gimple_assign_lhs (stmt)),
120 gimple_assign_rhs1 (stmt),
121 gimple_assign_rhs2 (stmt));
122 else if (grhs_class == GIMPLE_UNARY_RHS)
123 t = build1 (gimple_assign_rhs_code (stmt),
124 TREE_TYPE (gimple_assign_lhs (stmt)),
125 gimple_assign_rhs1 (stmt));
126 else if (grhs_class == GIMPLE_SINGLE_RHS)
128 t = gimple_assign_rhs1 (stmt);
129 /* Avoid modifying this tree in place below. */
130 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
131 && gimple_location (stmt) != EXPR_LOCATION (t))
132 || (gimple_block (stmt)
133 && currently_expanding_to_rtl
134 && EXPR_P (t)))
135 t = copy_node (t);
137 else
138 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
/* Default for STACK_ALIGNMENT_NEEDED when nothing has defined it
   earlier. */
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
/* For an SSA_NAME X yield its underlying variable (SSA_NAME_VAR, which
   the users in this file test against NULL); for anything else yield X
   itself. */
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 struct stack_var
310 /* The Variable. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
314 if this variable becomes it's partition's representative. */
315 poly_uint64 size;
317 /* The *byte* alignment required for this variable. Or as, with the
318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* The partition representative. */
322 size_t representative;
324 /* The next stack variable in the partition, or EOC. */
325 size_t next;
327 /* The numbers of conflicting stack variables. */
328 bitmap conflicts;
/* End-of-chain marker stored in stack_var::next. */
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation.
   stack_vars_alloc is the allocated capacity of the array and
   stack_vars_num the number of entries in use (see add_stack_var);
   decl_to_stack_part maps a decl to its index in stack_vars. */
334 static struct stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
344 is non-decreasing.
   NOTE(review): the array is sorted with stack_var_cmp, whose own
   comments describe a decreasing-size order -- confirm which of the
   two descriptions is accurate. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
356 /* Used during expand_used_vars. Remember if we saw a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
360 /* Compute the byte alignment to use for DECL. Ignore alignment
361 we can't do with expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
369 align = TYPE_ALIGN (TREE_TYPE (decl));
370 else
372 align = LOCAL_DECL_ALIGNMENT (decl);
373 SET_DECL_ALIGN (decl, align);
375 return align / BITS_PER_UNIT;
378 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
379 down otherwise. Return truncated BASE value. */
381 static inline unsigned HOST_WIDE_INT
382 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
384 return align_up ? (base + align - 1) & -align : base & -align;
387 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
388 Return the frame offset. */
390 static poly_int64
391 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
393 poly_int64 offset, new_frame_offset;
395 if (FRAME_GROWS_DOWNWARD)
397 new_frame_offset
398 = aligned_lower_bound (frame_offset - frame_phase - size,
399 align) + frame_phase;
400 offset = new_frame_offset;
402 else
404 new_frame_offset
405 = aligned_upper_bound (frame_offset - frame_phase,
406 align) + frame_phase;
407 offset = new_frame_offset;
408 new_frame_offset += size;
410 frame_offset = new_frame_offset;
412 if (frame_offset_overflow (frame_offset, cfun->decl))
413 frame_offset = offset = 0;
415 return offset;
418 /* Accumulate DECL into STACK_VARS. */
420 static void
421 add_stack_var (tree decl)
423 struct stack_var *v;
425 if (stack_vars_num >= stack_vars_alloc)
427 if (stack_vars_alloc)
428 stack_vars_alloc = stack_vars_alloc * 3 / 2;
429 else
430 stack_vars_alloc = 32;
431 stack_vars
432 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
434 if (!decl_to_stack_part)
435 decl_to_stack_part = new hash_map<tree, size_t>;
437 v = &stack_vars[stack_vars_num];
438 decl_to_stack_part->put (decl, stack_vars_num);
440 v->decl = decl;
441 tree size = TREE_CODE (decl) == SSA_NAME
442 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
443 : DECL_SIZE_UNIT (decl);
444 v->size = tree_to_poly_uint64 (size);
445 /* Ensure that all variables have size, so that &a != &b for any two
446 variables that are simultaneously live. */
447 if (known_eq (v->size, 0U))
448 v->size = 1;
449 v->alignb = align_local_variable (decl);
450 /* An alignment of zero can mightily confuse us later. */
451 gcc_assert (v->alignb != 0);
453 /* All variables are initially in their own partition. */
454 v->representative = stack_vars_num;
455 v->next = EOC;
457 /* All variables initially conflict with no other. */
458 v->conflicts = NULL;
460 /* Ensure that this decl doesn't get put onto the list twice. */
461 set_rtl (decl, pc_rtx);
463 stack_vars_num++;
466 /* Make the decls associated with luid's X and Y conflict. */
468 static void
469 add_stack_var_conflict (size_t x, size_t y)
471 struct stack_var *a = &stack_vars[x];
472 struct stack_var *b = &stack_vars[y];
473 if (!a->conflicts)
474 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
475 if (!b->conflicts)
476 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
477 bitmap_set_bit (a->conflicts, y);
478 bitmap_set_bit (b->conflicts, x);
481 /* Check whether the decls associated with luid's X and Y conflict. */
483 static bool
484 stack_var_conflict_p (size_t x, size_t y)
486 struct stack_var *a = &stack_vars[x];
487 struct stack_var *b = &stack_vars[y];
488 if (x == y)
489 return false;
490 /* Partitions containing an SSA name result from gimple registers
491 with things like unsupported modes. They are top-level and
492 hence conflict with everything else. */
493 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
494 return true;
496 if (!a->conflicts || !b->conflicts)
497 return false;
498 return bitmap_bit_p (a->conflicts, y);
501 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
502 enter its partition number into bitmap DATA. */
504 static bool
505 visit_op (gimple *, tree op, tree, void *data)
507 bitmap active = (bitmap)data;
508 op = get_base_address (op);
509 if (op
510 && DECL_P (op)
511 && DECL_RTL_IF_SET (op) == pc_rtx)
513 size_t *v = decl_to_stack_part->get (op);
514 if (v)
515 bitmap_set_bit (active, *v);
517 return false;
520 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
521 record conflicts between it and all currently active other partitions
522 from bitmap DATA. */
524 static bool
525 visit_conflict (gimple *, tree op, tree, void *data)
527 bitmap active = (bitmap)data;
528 op = get_base_address (op);
529 if (op
530 && DECL_P (op)
531 && DECL_RTL_IF_SET (op) == pc_rtx)
533 size_t *v = decl_to_stack_part->get (op);
534 if (v && bitmap_set_bit (active, *v))
536 size_t num = *v;
537 bitmap_iterator bi;
538 unsigned i;
539 gcc_assert (num < stack_vars_num);
540 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
541 add_stack_var_conflict (num, i);
544 return false;
547 /* Helper routine for add_scope_conflicts, calculating the active partitions
548 at the end of BB, leaving the result in WORK. We're called to generate
549 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
550 liveness. */
552 static void
553 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
555 edge e;
556 edge_iterator ei;
557 gimple_stmt_iterator gsi;
558 walk_stmt_load_store_addr_fn visit;
560 bitmap_clear (work);
561 FOR_EACH_EDGE (e, ei, bb->preds)
562 bitmap_ior_into (work, (bitmap)e->src->aux);
564 visit = visit_op;
566 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
568 gimple *stmt = gsi_stmt (gsi);
569 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
571 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
573 gimple *stmt = gsi_stmt (gsi);
575 if (gimple_clobber_p (stmt))
577 tree lhs = gimple_assign_lhs (stmt);
578 size_t *v;
579 /* Nested function lowering might introduce LHSs
580 that are COMPONENT_REFs. */
581 if (!VAR_P (lhs))
582 continue;
583 if (DECL_RTL_IF_SET (lhs) == pc_rtx
584 && (v = decl_to_stack_part->get (lhs)))
585 bitmap_clear_bit (work, *v);
587 else if (!is_gimple_debug (stmt))
589 if (for_conflict
590 && visit == visit_op)
592 /* If this is the first real instruction in this BB we need
593 to add conflicts for everything live at this point now.
594 Unlike classical liveness for named objects we can't
595 rely on seeing a def/use of the names we're interested in.
596 There might merely be indirect loads/stores. We'd not add any
597 conflicts for such partitions. */
598 bitmap_iterator bi;
599 unsigned i;
600 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
602 struct stack_var *a = &stack_vars[i];
603 if (!a->conflicts)
604 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
605 bitmap_ior_into (a->conflicts, work);
607 visit = visit_conflict;
609 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
614 /* Generate stack partition conflicts between all partitions that are
615 simultaneously live. */
617 static void
618 add_scope_conflicts (void)
620 basic_block bb;
621 bool changed;
622 bitmap work = BITMAP_ALLOC (NULL);
623 int *rpo;
624 int n_bbs;
626 /* We approximate the live range of a stack variable by taking the first
627 mention of its name as starting point(s), and by the end-of-scope
628 death clobber added by gimplify as ending point(s) of the range.
629 This overapproximates in the case we for instance moved an address-taken
630 operation upward, without also moving a dereference to it upwards.
631 But it's conservatively correct as a variable never can hold values
632 before its name is mentioned at least once.
634 We then do a mostly classical bitmap liveness algorithm. */
636 FOR_ALL_BB_FN (bb, cfun)
637 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
639 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
640 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
642 changed = true;
643 while (changed)
645 int i;
646 changed = false;
647 for (i = 0; i < n_bbs; i++)
649 bitmap active;
650 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
651 active = (bitmap)bb->aux;
652 add_scope_conflicts_1 (bb, work, false);
653 if (bitmap_ior_into (active, work))
654 changed = true;
658 FOR_EACH_BB_FN (bb, cfun)
659 add_scope_conflicts_1 (bb, work, true);
661 free (rpo);
662 BITMAP_FREE (work);
663 FOR_ALL_BB_FN (bb, cfun)
664 BITMAP_FREE (bb->aux);
667 /* A subroutine of partition_stack_vars. A comparison function for qsort,
668 sorting an array of indices by the properties of the object. */
670 static int
671 stack_var_cmp (const void *a, const void *b)
673 size_t ia = *(const size_t *)a;
674 size_t ib = *(const size_t *)b;
675 unsigned int aligna = stack_vars[ia].alignb;
676 unsigned int alignb = stack_vars[ib].alignb;
677 poly_int64 sizea = stack_vars[ia].size;
678 poly_int64 sizeb = stack_vars[ib].size;
679 tree decla = stack_vars[ia].decl;
680 tree declb = stack_vars[ib].decl;
681 bool largea, largeb;
682 unsigned int uida, uidb;
684 /* Primary compare on "large" alignment. Large comes first. */
685 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
686 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
687 if (largea != largeb)
688 return (int)largeb - (int)largea;
690 /* Secondary compare on size, decreasing */
691 int diff = compare_sizes_for_sort (sizeb, sizea);
692 if (diff != 0)
693 return diff;
695 /* Tertiary compare on true alignment, decreasing. */
696 if (aligna < alignb)
697 return -1;
698 if (aligna > alignb)
699 return 1;
701 /* Final compare on ID for sort stability, increasing.
702 Two SSA names are compared by their version, SSA names come before
703 non-SSA names, and two normal decls are compared by their DECL_UID. */
704 if (TREE_CODE (decla) == SSA_NAME)
706 if (TREE_CODE (declb) == SSA_NAME)
707 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
708 else
709 return -1;
711 else if (TREE_CODE (declb) == SSA_NAME)
712 return 1;
713 else
714 uida = DECL_UID (decla), uidb = DECL_UID (declb);
715 if (uida < uidb)
716 return 1;
717 if (uida > uidb)
718 return -1;
719 return 0;
/* Hash map from a size_t key to a bitmap. In this file the keys are
   DECL_PT_UIDs and the values are the bitmaps describing the stack
   partition each decl belongs to (see
   update_alias_info_with_stack_vars). */
722 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
723 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
725 /* If the points-to solution *PI points to variables that are in a partition
726 together with other variables add all partition members to the pointed-to
727 variables bitmap. */
729 static void
730 add_partitioned_vars_to_ptset (struct pt_solution *pt,
731 part_hashmap *decls_to_partitions,
732 hash_set<bitmap> *visited, bitmap temp)
734 bitmap_iterator bi;
735 unsigned i;
736 bitmap *part;
738 if (pt->anything
739 || pt->vars == NULL
740 /* The pointed-to vars bitmap is shared, it is enough to
741 visit it once. */
742 || visited->add (pt->vars))
743 return;
745 bitmap_clear (temp);
747 /* By using a temporary bitmap to store all members of the partitions
748 we have to add we make sure to visit each of the partitions only
749 once. */
750 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
751 if ((!temp
752 || !bitmap_bit_p (temp, i))
753 && (part = decls_to_partitions->get (i)))
754 bitmap_ior_into (temp, *part);
755 if (!bitmap_empty_p (temp))
756 bitmap_ior_into (pt->vars, temp);
759 /* Update points-to sets based on partition info, so we can use them on RTL.
760 The bitmaps representing stack partitions will be saved until expand,
761 where partitioned decls used as bases in memory expressions will be
762 rewritten. */
764 static void
765 update_alias_info_with_stack_vars (void)
767 part_hashmap *decls_to_partitions = NULL;
768 size_t i, j;
769 tree var = NULL_TREE;
771 for (i = 0; i < stack_vars_num; i++)
773 bitmap part = NULL;
774 tree name;
775 struct ptr_info_def *pi;
777 /* Not interested in partitions with single variable. */
778 if (stack_vars[i].representative != i
779 || stack_vars[i].next == EOC)
780 continue;
782 if (!decls_to_partitions)
784 decls_to_partitions = new part_hashmap;
785 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
788 /* Create an SSA_NAME that points to the partition for use
789 as base during alias-oracle queries on RTL for bases that
790 have been partitioned. */
791 if (var == NULL_TREE)
792 var = create_tmp_var (ptr_type_node);
793 name = make_ssa_name (var);
795 /* Create bitmaps representing partitions. They will be used for
796 points-to sets later, so use GGC alloc. */
797 part = BITMAP_GGC_ALLOC ();
798 for (j = i; j != EOC; j = stack_vars[j].next)
800 tree decl = stack_vars[j].decl;
801 unsigned int uid = DECL_PT_UID (decl);
802 bitmap_set_bit (part, uid);
803 decls_to_partitions->put (uid, part);
804 cfun->gimple_df->decls_to_pointers->put (decl, name);
805 if (TREE_ADDRESSABLE (decl))
806 TREE_ADDRESSABLE (name) = 1;
809 /* Make the SSA name point to all partition members. */
810 pi = get_ptr_info (name);
811 pt_solution_set (&pi->pt, part, false);
814 /* Make all points-to sets that contain one member of a partition
815 contain all members of the partition. */
816 if (decls_to_partitions)
818 unsigned i;
819 tree name;
820 hash_set<bitmap> visited;
821 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
823 FOR_EACH_SSA_NAME (i, name, cfun)
825 struct ptr_info_def *pi;
827 if (POINTER_TYPE_P (TREE_TYPE (name))
828 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
829 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
830 &visited, temp);
833 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
834 decls_to_partitions, &visited, temp);
836 delete decls_to_partitions;
837 BITMAP_FREE (temp);
841 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
842 partitioning algorithm. Partitions A and B are known to be non-conflicting.
843 Merge them into a single partition A. */
845 static void
846 union_stack_vars (size_t a, size_t b)
848 struct stack_var *vb = &stack_vars[b];
849 bitmap_iterator bi;
850 unsigned u;
852 gcc_assert (stack_vars[b].next == EOC);
853 /* Add B to A's partition. */
854 stack_vars[b].next = stack_vars[a].next;
855 stack_vars[b].representative = a;
856 stack_vars[a].next = b;
858 /* Update the required alignment of partition A to account for B. */
859 if (stack_vars[a].alignb < stack_vars[b].alignb)
860 stack_vars[a].alignb = stack_vars[b].alignb;
862 /* Update the interference graph and merge the conflicts. */
863 if (vb->conflicts)
865 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
866 add_stack_var_conflict (a, stack_vars[u].representative);
867 BITMAP_FREE (vb->conflicts);
871 /* A subroutine of expand_used_vars. Binpack the variables into
872 partitions constrained by the interference graph. The overall
873 algorithm used is as follows:
875 Sort the objects by size in descending order.
876 For each object A {
877 S = size(A)
878 O = 0
879 loop {
880 Look for the largest non-conflicting object B with size <= S.
881 UNION (A, B)
886 static void
887 partition_stack_vars (void)
889 size_t si, sj, n = stack_vars_num;
891 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
892 for (si = 0; si < n; ++si)
893 stack_vars_sorted[si] = si;
895 if (n == 1)
896 return;
898 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
900 for (si = 0; si < n; ++si)
902 size_t i = stack_vars_sorted[si];
903 unsigned int ialign = stack_vars[i].alignb;
904 poly_int64 isize = stack_vars[i].size;
906 /* Ignore objects that aren't partition representatives. If we
907 see a var that is not a partition representative, it must
908 have been merged earlier. */
909 if (stack_vars[i].representative != i)
910 continue;
912 for (sj = si + 1; sj < n; ++sj)
914 size_t j = stack_vars_sorted[sj];
915 unsigned int jalign = stack_vars[j].alignb;
916 poly_int64 jsize = stack_vars[j].size;
918 /* Ignore objects that aren't partition representatives. */
919 if (stack_vars[j].representative != j)
920 continue;
922 /* Do not mix objects of "small" (supported) alignment
923 and "large" (unsupported) alignment. */
924 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
925 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
926 break;
928 /* For Address Sanitizer do not mix objects with different
929 sizes, as the shorter vars wouldn't be adequately protected.
930 Don't do that for "large" (unsupported) alignment objects,
931 those aren't protected anyway. */
932 if (asan_sanitize_stack_p ()
933 && maybe_ne (isize, jsize)
934 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
935 break;
937 /* Ignore conflicting objects. */
938 if (stack_var_conflict_p (i, j))
939 continue;
941 /* UNION the objects, placing J at OFFSET. */
942 union_stack_vars (i, j);
946 update_alias_info_with_stack_vars ();
949 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
951 static void
952 dump_stack_var_partition (void)
954 size_t si, i, j, n = stack_vars_num;
956 for (si = 0; si < n; ++si)
958 i = stack_vars_sorted[si];
960 /* Skip variables that aren't partition representatives, for now. */
961 if (stack_vars[i].representative != i)
962 continue;
964 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
965 print_dec (stack_vars[i].size, dump_file);
966 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
968 for (j = i; j != EOC; j = stack_vars[j].next)
970 fputc ('\t', dump_file);
971 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
973 fputc ('\n', dump_file);
977 /* Assign rtl to DECL at BASE + OFFSET. */
979 static void
980 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
981 poly_int64 offset)
983 unsigned align;
984 rtx x;
986 /* If this fails, we've overflowed the stack frame. Error nicely? */
987 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
989 x = plus_constant (Pmode, base, offset);
990 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
991 ? TYPE_MODE (TREE_TYPE (decl))
992 : DECL_MODE (SSAVAR (decl)), x);
994 if (TREE_CODE (decl) != SSA_NAME)
996 /* Set alignment we actually gave this decl if it isn't an SSA name.
997 If it is we generate stack slots only accidentally so it isn't as
998 important, we'll simply use the alignment that is already set. */
999 if (base == virtual_stack_vars_rtx)
1000 offset -= frame_phase;
1001 align = known_alignment (offset);
1002 align *= BITS_PER_UNIT;
1003 if (align == 0 || align > base_align)
1004 align = base_align;
1006 /* One would think that we could assert that we're not decreasing
1007 alignment here, but (at least) the i386 port does exactly this
1008 via the MINIMUM_ALIGNMENT hook. */
1010 SET_DECL_ALIGN (decl, align);
1011 DECL_USER_ALIGN (decl) = 0;
1014 set_rtl (decl, x);
1017 struct stack_vars_data
1019 /* Vector of offset pairs, always end of some padding followed
1020 by start of the padding that needs Address Sanitizer protection.
1021 The vector is in reversed, highest offset pairs come first. */
1022 auto_vec<HOST_WIDE_INT> asan_vec;
1024 /* Vector of partition representative decls in between the paddings. */
1025 auto_vec<tree> asan_decl_vec;
1027 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1028 rtx asan_base;
1030 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1031 unsigned int asan_alignb;
1034 /* A subroutine of expand_used_vars. Give each partition representative
1035 a unique location within the stack frame. Update each partition member
1036 with that location. */
/* PRED, when non-NULL, selects which partition representatives are laid
   out by this call; representatives for which it returns false are left
   for a later call.  Variables whose alignment exceeds
   MAX_SUPPORTED_STACK_ALIGNMENT are only handled when PRED is NULL.
   DATA accumulates the Address Sanitizer bookkeeping (offset pairs,
   representative decls, base pseudo and alignment) for variables laid
   out on the ASAN path.  */
1038 static void
1039 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1041 size_t si, i, j, n = stack_vars_num;
1042 poly_uint64 large_size = 0, large_alloc = 0;
1043 rtx large_base = NULL;
1044 unsigned large_align = 0;
1045 bool large_allocation_done = false;
1046 tree decl;
1048 /* Determine if there are any variables requiring "large" alignment.
1049 Since these are dynamically allocated, we only process these if
1050 no predicate involved. */
/* NOTE(review): this reads stack_vars_sorted[0] unconditionally, so it
   presumably relies on callers only invoking it when stack_vars_num > 0
   -- confirm against the callers.  */
1051 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1052 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1054 /* Find the total size of these variables. */
1055 for (si = 0; si < n; ++si)
1057 unsigned alignb;
1059 i = stack_vars_sorted[si];
1060 alignb = stack_vars[i].alignb;
1062 /* All "large" alignment decls come before all "small" alignment
1063 decls, but "large" alignment decls are not sorted based on
1064 their alignment. Increase large_align to track the largest
1065 required alignment. */
1066 if ((alignb * BITS_PER_UNIT) > large_align)
1067 large_align = alignb * BITS_PER_UNIT;
1069 /* Stop when we get to the first decl with "small" alignment. */
1070 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1071 break;
1073 /* Skip variables that aren't partition representatives. */
1074 if (stack_vars[i].representative != i)
1075 continue;
1077 /* Skip variables that have already had rtl assigned. See also
1078 add_stack_var where we perpetrate this pc_rtx hack. */
1079 decl = stack_vars[i].decl;
1080 if (TREE_CODE (decl) == SSA_NAME
1081 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1082 : DECL_RTL (decl) != pc_rtx)
1083 continue;
1085 large_size = aligned_upper_bound (large_size, alignb);
1086 large_size += stack_vars[i].size;
/* Second pass: pick a base and offset for every selected partition
   representative and apply it to all members of its partition.  */
1090 for (si = 0; si < n; ++si)
1092 rtx base;
1093 unsigned base_align, alignb;
1094 poly_int64 offset;
1096 i = stack_vars_sorted[si];
1098 /* Skip variables that aren't partition representatives, for now. */
1099 if (stack_vars[i].representative != i)
1100 continue;
1102 /* Skip variables that have already had rtl assigned. See also
1103 add_stack_var where we perpetrate this pc_rtx hack. */
1104 decl = stack_vars[i].decl;
1105 if (TREE_CODE (decl) == SSA_NAME
1106 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1107 : DECL_RTL (decl) != pc_rtx)
1108 continue;
1110 /* Check the predicate to see whether this variable should be
1111 allocated in this pass. */
1112 if (pred && !pred (i))
1113 continue;
1115 alignb = stack_vars[i].alignb;
1116 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1118 base = virtual_stack_vars_rtx;
1119 /* ASAN description strings don't yet have a syntax for expressing
1120 polynomial offsets. */
1121 HOST_WIDE_INT prev_offset;
1122 if (asan_sanitize_stack_p ()
1123 && pred
1124 && frame_offset.is_constant (&prev_offset)
1125 && stack_vars[i].size.is_constant ())
1127 prev_offset = align_base (prev_offset,
1128 MAX (alignb, ASAN_RED_ZONE_SIZE),
1129 !FRAME_GROWS_DOWNWARD);
1130 tree repr_decl = NULL_TREE;
/* Reserve the variable plus one red zone, aligned to at least the red
   zone size.  */
1131 offset
1132 = alloc_stack_frame_space (stack_vars[i].size
1133 + ASAN_RED_ZONE_SIZE,
1134 MAX (alignb, ASAN_RED_ZONE_SIZE));
/* Two entries are pushed per variable: the aligned frame offset from
   before the allocation, then the offset just past the variable.  */
1136 data->asan_vec.safe_push (prev_offset);
1137 /* Allocating a constant amount of space from a constant
1138 starting offset must give a constant result. */
1139 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1140 .to_constant ());
1141 /* Find best representative of the partition.
1142 Prefer those with DECL_NAME, even better
1143 satisfying asan_protect_stack_decl predicate. */
1144 for (j = i; j != EOC; j = stack_vars[j].next)
1145 if (asan_protect_stack_decl (stack_vars[j].decl)
1146 && DECL_NAME (stack_vars[j].decl))
1148 repr_decl = stack_vars[j].decl;
1149 break;
1151 else if (repr_decl == NULL_TREE
1152 && DECL_P (stack_vars[j].decl)
1153 && DECL_NAME (stack_vars[j].decl))
1154 repr_decl = stack_vars[j].decl;
1155 if (repr_decl == NULL_TREE)
1156 repr_decl = stack_vars[i].decl;
1157 data->asan_decl_vec.safe_push (repr_decl);
1159 /* Make sure a representative is unpoisoned if another
1160 variable in the partition is handled by
1161 use-after-scope sanitization. */
1162 if (asan_handled_variables != NULL
1163 && !asan_handled_variables->contains (repr_decl))
1165 for (j = i; j != EOC; j = stack_vars[j].next)
1166 if (asan_handled_variables->contains (stack_vars[j].decl))
1167 break;
1168 if (j != EOC)
1169 asan_handled_variables->add (repr_decl);
1172 data->asan_alignb = MAX (data->asan_alignb, alignb);
/* The ASAN base pseudo is created on first use and then shared by all
   variables laid out on this path.  */
1173 if (data->asan_base == NULL)
1174 data->asan_base = gen_reg_rtx (Pmode);
1175 base = data->asan_base;
1177 if (!STRICT_ALIGNMENT)
1178 base_align = crtl->max_used_stack_slot_alignment;
1179 else
1180 base_align = MAX (crtl->max_used_stack_slot_alignment,
1181 GET_MODE_ALIGNMENT (SImode)
1182 << ASAN_SHADOW_SHIFT);
1184 else
1186 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1187 base_align = crtl->max_used_stack_slot_alignment;
1190 else
1192 /* Large alignment is only processed in the last pass. */
1193 if (pred)
1194 continue;
1196 /* If there were any variables requiring "large" alignment, allocate
1197 space. */
1198 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1200 poly_int64 loffset;
1201 rtx large_allocsize;
1203 large_allocsize = gen_int_mode (large_size, Pmode);
1204 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1205 loffset = alloc_stack_frame_space
1206 (rtx_to_poly_int64 (large_allocsize),
1207 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1208 large_base = get_dynamic_stack_base (loffset, large_align);
1209 large_allocation_done = true;
1211 gcc_assert (large_base != NULL);
/* Offsets of "large" variables are relative to LARGE_BASE and are
   accumulated in LARGE_ALLOC.  */
1213 large_alloc = aligned_upper_bound (large_alloc, alignb);
1214 offset = large_alloc;
1215 large_alloc += stack_vars[i].size;
1217 base = large_base;
1218 base_align = large_align;
1221 /* Create rtl for each variable based on their location within the
1222 partition. */
1223 for (j = i; j != EOC; j = stack_vars[j].next)
1225 expand_one_stack_var_at (stack_vars[j].decl,
1226 base, base_align,
1227 offset);
/* Everything sized in the first loop must have been placed.  */
1231 gcc_assert (known_eq (large_alloc, large_size));
1234 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1235 static poly_uint64
1236 account_stack_vars (void)
1238 size_t si, j, i, n = stack_vars_num;
1239 poly_uint64 size = 0;
1241 for (si = 0; si < n; ++si)
1243 i = stack_vars_sorted[si];
1245 /* Skip variables that aren't partition representatives, for now. */
1246 if (stack_vars[i].representative != i)
1247 continue;
1249 size += stack_vars[i].size;
1250 for (j = i; j != EOC; j = stack_vars[j].next)
1251 set_rtl (stack_vars[j].decl, NULL);
1253 return size;
1256 /* Record the RTL assignment X for the default def of PARM. */
1258 extern void
1259 set_parm_rtl (tree parm, rtx x)
1261 gcc_assert (TREE_CODE (parm) == PARM_DECL
1262 || TREE_CODE (parm) == RESULT_DECL);
1264 if (x && !MEM_P (x))
1266 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1267 TYPE_MODE (TREE_TYPE (parm)),
1268 TYPE_ALIGN (TREE_TYPE (parm)));
1270 /* If the variable alignment is very large we'll dynamicaly
1271 allocate it, which means that in-frame portion is just a
1272 pointer. ??? We've got a pseudo for sure here, do we
1273 actually dynamically allocate its spilling area if needed?
1274 ??? Isn't it a problem when Pmode alignment also exceeds
1275 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1276 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1277 align = GET_MODE_ALIGNMENT (Pmode);
1279 record_alignment_for_reg_var (align);
1282 tree ssa = ssa_default_def (cfun, parm);
1283 if (!ssa)
1284 return set_rtl (parm, x);
1286 int part = var_to_partition (SA.map, ssa);
1287 gcc_assert (part != NO_PARTITION);
1289 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1290 gcc_assert (changed);
1292 set_rtl (ssa, x);
1293 gcc_assert (DECL_RTL (parm) == x);
1296 /* A subroutine of expand_one_var. Called to immediately assign rtl
1297 to a variable to be allocated in the stack frame. */
1299 static void
1300 expand_one_stack_var_1 (tree var)
1302 poly_uint64 size;
1303 poly_int64 offset;
1304 unsigned byte_align;
1306 if (TREE_CODE (var) == SSA_NAME)
1308 tree type = TREE_TYPE (var);
1309 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1310 byte_align = TYPE_ALIGN_UNIT (type);
1312 else
1314 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1315 byte_align = align_local_variable (var);
1318 /* We handle highly aligned variables in expand_stack_vars. */
1319 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1321 offset = alloc_stack_frame_space (size, byte_align);
1323 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1324 crtl->max_used_stack_slot_alignment, offset);
1327 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1328 already assigned some MEM. */
1330 static void
1331 expand_one_stack_var (tree var)
1333 if (TREE_CODE (var) == SSA_NAME)
1335 int part = var_to_partition (SA.map, var);
1336 if (part != NO_PARTITION)
1338 rtx x = SA.partition_to_pseudo[part];
1339 gcc_assert (x);
1340 gcc_assert (MEM_P (x));
1341 return;
1345 return expand_one_stack_var_1 (var);
1348 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1349 that will reside in a hard register. */
1351 static void
1352 expand_one_hard_reg_var (tree var)
1354 rest_of_decl_compilation (var, 0, 0);
1357 /* Record the alignment requirements of some variable assigned to a
1358 pseudo. */
1360 static void
1361 record_alignment_for_reg_var (unsigned int align)
1363 if (SUPPORTS_STACK_ALIGNMENT
1364 && crtl->stack_alignment_estimated < align)
1366 /* stack_alignment_estimated shouldn't change after stack
1367 realign decision made */
1368 gcc_assert (!crtl->stack_realign_processed);
1369 crtl->stack_alignment_estimated = align;
1372 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1373 So here we only make sure stack_alignment_needed >= align. */
1374 if (crtl->stack_alignment_needed < align)
1375 crtl->stack_alignment_needed = align;
1376 if (crtl->max_used_stack_slot_alignment < align)
1377 crtl->max_used_stack_slot_alignment = align;
1380 /* Create RTL for an SSA partition. */
1382 static void
1383 expand_one_ssa_partition (tree var)
1385 int part = var_to_partition (SA.map, var);
1386 gcc_assert (part != NO_PARTITION);
1388 if (SA.partition_to_pseudo[part])
1389 return;
1391 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1392 TYPE_MODE (TREE_TYPE (var)),
1393 TYPE_ALIGN (TREE_TYPE (var)));
1395 /* If the variable alignment is very large we'll dynamicaly allocate
1396 it, which means that in-frame portion is just a pointer. */
1397 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1398 align = GET_MODE_ALIGNMENT (Pmode);
1400 record_alignment_for_reg_var (align);
1402 if (!use_register_for_decl (var))
1404 if (defer_stack_allocation (var, true))
1405 add_stack_var (var);
1406 else
1407 expand_one_stack_var_1 (var);
1408 return;
1411 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1412 rtx x = gen_reg_rtx (reg_mode);
1414 set_rtl (var, x);
1416 /* For a promoted variable, X will not be used directly but wrapped in a
1417 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1418 will assume that its upper bits can be inferred from its lower bits.
1419 Therefore, if X isn't initialized on every path from the entry, then
1420 we must do it manually in order to fulfill the above assumption. */
1421 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1422 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1423 emit_move_insn (x, CONST0_RTX (reg_mode));
1426 /* Record the association between the RTL generated for partition PART
1427 and the underlying variable of the SSA_NAME VAR. */
1429 static void
1430 adjust_one_expanded_partition_var (tree var)
1432 if (!var)
1433 return;
1435 tree decl = SSA_NAME_VAR (var);
1437 int part = var_to_partition (SA.map, var);
1438 if (part == NO_PARTITION)
1439 return;
1441 rtx x = SA.partition_to_pseudo[part];
1443 gcc_assert (x);
1445 set_rtl (var, x);
1447 if (!REG_P (x))
1448 return;
1450 /* Note if the object is a user variable. */
1451 if (decl && !DECL_ARTIFICIAL (decl))
1452 mark_user_reg (x);
1454 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1455 mark_reg_pointer (x, get_pointer_alignment (var));
1458 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1459 that will reside in a pseudo register. */
1461 static void
1462 expand_one_register_var (tree var)
1464 if (TREE_CODE (var) == SSA_NAME)
1466 int part = var_to_partition (SA.map, var);
1467 if (part != NO_PARTITION)
1469 rtx x = SA.partition_to_pseudo[part];
1470 gcc_assert (x);
1471 gcc_assert (REG_P (x));
1472 return;
1474 gcc_unreachable ();
1477 tree decl = var;
1478 tree type = TREE_TYPE (decl);
1479 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1480 rtx x = gen_reg_rtx (reg_mode);
1482 set_rtl (var, x);
1484 /* Note if the object is a user variable. */
1485 if (!DECL_ARTIFICIAL (decl))
1486 mark_user_reg (x);
1488 if (POINTER_TYPE_P (type))
1489 mark_reg_pointer (x, get_pointer_alignment (var));
1492 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1493 has some associated error, e.g. its type is error-mark. We just need
1494 to pick something that won't crash the rest of the compiler. */
1496 static void
1497 expand_one_error_var (tree var)
1499 machine_mode mode = DECL_MODE (var);
1500 rtx x;
1502 if (mode == BLKmode)
1503 x = gen_rtx_MEM (BLKmode, const0_rtx);
1504 else if (mode == VOIDmode)
1505 x = const0_rtx;
1506 else
1507 x = gen_reg_rtx (mode);
1509 SET_DECL_RTL (var, x);
1512 /* A subroutine of expand_one_var. VAR is a variable that will be
1513 allocated to the local stack frame. Return true if we wish to
1514 add VAR to STACK_VARS so that it will be coalesced with other
1515 variables. Return false to allocate VAR immediately.
1517 This function is used to reduce the number of variables considered
1518 for coalescing, which reduces the size of the quadratic problem. */
1520 static bool
1521 defer_stack_allocation (tree var, bool toplevel)
1523 tree size_unit = TREE_CODE (var) == SSA_NAME
1524 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1525 : DECL_SIZE_UNIT (var);
1526 poly_uint64 size;
1528 /* Whether the variable is small enough for immediate allocation not to be
1529 a problem with regard to the frame size. */
1530 bool smallish
1531 = (poly_int_tree_p (size_unit, &size)
1532 && (estimated_poly_value (size)
1533 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING)));
1535 /* If stack protection is enabled, *all* stack variables must be deferred,
1536 so that we can re-order the strings to the top of the frame.
1537 Similarly for Address Sanitizer. */
1538 if (flag_stack_protect || asan_sanitize_stack_p ())
1539 return true;
1541 unsigned int align = TREE_CODE (var) == SSA_NAME
1542 ? TYPE_ALIGN (TREE_TYPE (var))
1543 : DECL_ALIGN (var);
1545 /* We handle "large" alignment via dynamic allocation. We want to handle
1546 this extra complication in only one place, so defer them. */
1547 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1548 return true;
1550 bool ignored = TREE_CODE (var) == SSA_NAME
1551 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1552 : DECL_IGNORED_P (var);
1554 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1555 might be detached from their block and appear at toplevel when we reach
1556 here. We want to coalesce them with variables from other blocks when
1557 the immediate contribution to the frame size would be noticeable. */
1558 if (toplevel && optimize > 0 && ignored && !smallish)
1559 return true;
1561 /* Variables declared in the outermost scope automatically conflict
1562 with every other variable. The only reason to want to defer them
1563 at all is that, after sorting, we can more efficiently pack
1564 small variables in the stack frame. Continue to defer at -O2. */
1565 if (toplevel && optimize < 2)
1566 return false;
1568 /* Without optimization, *most* variables are allocated from the
1569 stack, which makes the quadratic problem large exactly when we
1570 want compilation to proceed as quickly as possible. On the
1571 other hand, we don't want the function's stack frame size to
1572 get completely out of hand. So we avoid adding scalars and
1573 "small" aggregates to the list at all. */
1574 if (optimize == 0 && smallish)
1575 return false;
1577 return true;
1580 /* A subroutine of expand_used_vars. Expand one variable according to
1581 its flavor. Variables to be placed on the stack are not actually
1582 expanded yet, merely recorded.
1583 When REALLY_EXPAND is false, only add stack values to be allocated.
1584 Return stack usage this variable is supposed to take.
1587 static poly_uint64
1588 expand_one_var (tree var, bool toplevel, bool really_expand)
1590 unsigned int align = BITS_PER_UNIT;
1591 tree origvar = var;
1593 var = SSAVAR (var);
1595 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1597 if (is_global_var (var))
1598 return 0;
1600 /* Because we don't know if VAR will be in register or on stack,
1601 we conservatively assume it will be on stack even if VAR is
1602 eventually put into register after RA pass. For non-automatic
1603 variables, which won't be on stack, we collect alignment of
1604 type and ignore user specified alignment. Similarly for
1605 SSA_NAMEs for which use_register_for_decl returns true. */
1606 if (TREE_STATIC (var)
1607 || DECL_EXTERNAL (var)
1608 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1609 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1610 TYPE_MODE (TREE_TYPE (var)),
1611 TYPE_ALIGN (TREE_TYPE (var)));
1612 else if (DECL_HAS_VALUE_EXPR_P (var)
1613 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1614 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1615 or variables which were assigned a stack slot already by
1616 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1617 changed from the offset chosen to it. */
1618 align = crtl->stack_alignment_estimated;
1619 else
1620 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1622 /* If the variable alignment is very large we'll dynamicaly allocate
1623 it, which means that in-frame portion is just a pointer. */
1624 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1625 align = GET_MODE_ALIGNMENT (Pmode);
1628 record_alignment_for_reg_var (align);
1630 poly_uint64 size;
1631 if (TREE_CODE (origvar) == SSA_NAME)
1633 gcc_assert (!VAR_P (var)
1634 || (!DECL_EXTERNAL (var)
1635 && !DECL_HAS_VALUE_EXPR_P (var)
1636 && !TREE_STATIC (var)
1637 && TREE_TYPE (var) != error_mark_node
1638 && !DECL_HARD_REGISTER (var)
1639 && really_expand));
1641 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1643 else if (DECL_EXTERNAL (var))
1645 else if (DECL_HAS_VALUE_EXPR_P (var))
1647 else if (TREE_STATIC (var))
1649 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1651 else if (TREE_TYPE (var) == error_mark_node)
1653 if (really_expand)
1654 expand_one_error_var (var);
1656 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1658 if (really_expand)
1660 expand_one_hard_reg_var (var);
1661 if (!DECL_HARD_REGISTER (var))
1662 /* Invalid register specification. */
1663 expand_one_error_var (var);
1666 else if (use_register_for_decl (var))
1668 if (really_expand)
1669 expand_one_register_var (origvar);
1671 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1672 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1674 /* Reject variables which cover more than half of the address-space. */
1675 if (really_expand)
1677 if (DECL_NONLOCAL_FRAME (var))
1678 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1679 "total size of local objects is too large");
1680 else
1681 error_at (DECL_SOURCE_LOCATION (var),
1682 "size of variable %q+D is too large", var);
1683 expand_one_error_var (var);
1686 else if (defer_stack_allocation (var, toplevel))
1687 add_stack_var (origvar);
1688 else
1690 if (really_expand)
1692 if (lookup_attribute ("naked",
1693 DECL_ATTRIBUTES (current_function_decl)))
1694 error ("cannot allocate stack for variable %q+D, naked function.",
1695 var);
1697 expand_one_stack_var (origvar);
1699 return size;
1701 return 0;
1704 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1705 expanding variables. Those variables that can be put into registers
1706 are allocated pseudos; those that can't are put on the stack.
1708 TOPLEVEL is true if this is the outermost BLOCK. */
1710 static void
1711 expand_used_vars_for_block (tree block, bool toplevel)
1713 tree t;
1715 /* Expand all variables at this level. */
1716 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1717 if (TREE_USED (t)
1718 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1719 || !DECL_NONSHAREABLE (t)))
1720 expand_one_var (t, toplevel, true);
1722 /* Expand all variables at containing levels. */
1723 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1724 expand_used_vars_for_block (t, false);
1727 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1728 and clear TREE_USED on all local variables. */
1730 static void
1731 clear_tree_used (tree block)
1733 tree t;
1735 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1736 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1737 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1738 || !DECL_NONSHAREABLE (t))
1739 TREE_USED (t) = 0;
1741 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1742 clear_tree_used (t);
/* Values that flag_stack_protect is compared against in this file.  The
   per-value notes describe when expand_used_vars creates a stack
   guard.  */
enum {
  /* Guard when the function calls alloca, has protected decls, or
     carries the "stack_protect" attribute.  */
  SPCT_FLAG_DEFAULT = 1,
  /* Guard unconditionally.  */
  SPCT_FLAG_ALL = 2,
  /* As SPCT_FLAG_DEFAULT, plus functions flagged by
     stack_protect_decl_p or stack_protect_return_slot_p.  */
  SPCT_FLAG_STRONG = 3,
  /* Guard only functions carrying the "stack_protect" attribute.  */
  SPCT_FLAG_EXPLICIT = 4
};
1752 /* Examine TYPE and determine a bit mask of the following features. */
1754 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1755 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1756 #define SPCT_HAS_ARRAY 4
1757 #define SPCT_HAS_AGGREGATE 8
1759 static unsigned int
1760 stack_protect_classify_type (tree type)
1762 unsigned int ret = 0;
1763 tree t;
1765 switch (TREE_CODE (type))
1767 case ARRAY_TYPE:
1768 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1769 if (t == char_type_node
1770 || t == signed_char_type_node
1771 || t == unsigned_char_type_node)
1773 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1774 unsigned HOST_WIDE_INT len;
1776 if (!TYPE_SIZE_UNIT (type)
1777 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1778 len = max;
1779 else
1780 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1782 if (len < max)
1783 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1784 else
1785 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1787 else
1788 ret = SPCT_HAS_ARRAY;
1789 break;
1791 case UNION_TYPE:
1792 case QUAL_UNION_TYPE:
1793 case RECORD_TYPE:
1794 ret = SPCT_HAS_AGGREGATE;
1795 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1796 if (TREE_CODE (t) == FIELD_DECL)
1797 ret |= stack_protect_classify_type (TREE_TYPE (t));
1798 break;
1800 default:
1801 break;
1804 return ret;
1807 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1808 part of the local stack frame. Remember if we ever return nonzero for
1809 any variable in this function. The return value is the phase number in
1810 which the variable should be allocated. */
1812 static int
1813 stack_protect_decl_phase (tree decl)
1815 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1816 int ret = 0;
1818 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1819 has_short_buffer = true;
1821 if (flag_stack_protect == SPCT_FLAG_ALL
1822 || flag_stack_protect == SPCT_FLAG_STRONG
1823 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1824 && lookup_attribute ("stack_protect",
1825 DECL_ATTRIBUTES (current_function_decl))))
1827 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1828 && !(bits & SPCT_HAS_AGGREGATE))
1829 ret = 1;
1830 else if (bits & SPCT_HAS_ARRAY)
1831 ret = 2;
1833 else
1834 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1836 if (ret)
1837 has_protected_decls = true;
1839 return ret;
1842 /* Two helper routines that check for phase 1 and phase 2. These are used
1843 as callbacks for expand_stack_vars. */
1845 static bool
1846 stack_protect_decl_phase_1 (size_t i)
1848 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1851 static bool
1852 stack_protect_decl_phase_2 (size_t i)
1854 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1857 /* And helper function that checks for asan phase (with stack protector
1858 it is phase 3). This is used as callback for expand_stack_vars.
1859 Returns true if any of the vars in the partition need to be protected. */
1861 static bool
1862 asan_decl_phase_3 (size_t i)
1864 while (i != EOC)
1866 if (asan_protect_stack_decl (stack_vars[i].decl))
1867 return true;
1868 i = stack_vars[i].next;
1870 return false;
1873 /* Ensure that variables in different stack protection phases conflict
1874 so that they are not merged and share the same stack slot. */
1876 static void
1877 add_stack_protection_conflicts (void)
1879 size_t i, j, n = stack_vars_num;
1880 unsigned char *phase;
1882 phase = XNEWVEC (unsigned char, n);
1883 for (i = 0; i < n; ++i)
1884 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1886 for (i = 0; i < n; ++i)
1888 unsigned char ph_i = phase[i];
1889 for (j = i + 1; j < n; ++j)
1890 if (ph_i != phase[j])
1891 add_stack_var_conflict (i, j);
1894 XDELETEVEC (phase);
1897 /* Create a decl for the guard at the top of the stack frame. */
1899 static void
1900 create_stack_guard (void)
1902 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1903 VAR_DECL, NULL, ptr_type_node);
1904 TREE_THIS_VOLATILE (guard) = 1;
1905 TREE_USED (guard) = 1;
1906 expand_one_stack_var (guard);
1907 crtl->stack_protect_guard = guard;
1910 /* Prepare for expanding variables. */
1911 static void
1912 init_vars_expansion (void)
1914 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1915 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1917 /* A map from decl to stack partition. */
1918 decl_to_stack_part = new hash_map<tree, size_t>;
1920 /* Initialize local stack smashing state. */
1921 has_protected_decls = false;
1922 has_short_buffer = false;
1925 /* Free up stack variable graph data. */
1926 static void
1927 fini_vars_expansion (void)
1929 bitmap_obstack_release (&stack_var_bitmap_obstack);
1930 if (stack_vars)
1931 XDELETEVEC (stack_vars);
1932 if (stack_vars_sorted)
1933 XDELETEVEC (stack_vars_sorted);
1934 stack_vars = NULL;
1935 stack_vars_sorted = NULL;
1936 stack_vars_alloc = stack_vars_num = 0;
1937 delete decl_to_stack_part;
1938 decl_to_stack_part = NULL;
1941 /* Make a fair guess for the size of the stack frame of the function
1942 in NODE. This doesn't have to be exact, the result is only used in
1943 the inline heuristics. So we don't want to run the full stack var
1944 packing algorithm (which is quadratic in the number of stack vars).
1945 Instead, we calculate the total size of all stack vars. This turns
1946 out to be a pretty fair estimate -- packing of stack vars doesn't
1947 happen very often. */
1949 HOST_WIDE_INT
1950 estimated_stack_frame_size (struct cgraph_node *node)
1952 poly_int64 size = 0;
1953 size_t i;
1954 tree var;
1955 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1957 push_cfun (fn);
1959 init_vars_expansion ();
1961 FOR_EACH_LOCAL_DECL (fn, i, var)
1962 if (auto_var_in_fn_p (var, fn->decl))
1963 size += expand_one_var (var, true, false);
1965 if (stack_vars_num > 0)
1967 /* Fake sorting the stack vars for account_stack_vars (). */
1968 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1969 for (i = 0; i < stack_vars_num; ++i)
1970 stack_vars_sorted[i] = i;
1971 size += account_stack_vars ();
1974 fini_vars_expansion ();
1975 pop_cfun ();
1976 return estimated_poly_value (size);
1979 /* Helper routine to check if a record or union contains an array field. */
1981 static int
1982 record_or_union_type_has_array_p (const_tree tree_type)
1984 tree fields = TYPE_FIELDS (tree_type);
1985 tree f;
1987 for (f = fields; f; f = DECL_CHAIN (f))
1988 if (TREE_CODE (f) == FIELD_DECL)
1990 tree field_type = TREE_TYPE (f);
1991 if (RECORD_OR_UNION_TYPE_P (field_type)
1992 && record_or_union_type_has_array_p (field_type))
1993 return 1;
1994 if (TREE_CODE (field_type) == ARRAY_TYPE)
1995 return 1;
1997 return 0;
2000 /* Check if the current function has local referenced variables that
2001 have their addresses taken, contain an array, or are arrays. */
2003 static bool
2004 stack_protect_decl_p ()
2006 unsigned i;
2007 tree var;
2009 FOR_EACH_LOCAL_DECL (cfun, i, var)
2010 if (!is_global_var (var))
2012 tree var_type = TREE_TYPE (var);
2013 if (VAR_P (var)
2014 && (TREE_CODE (var_type) == ARRAY_TYPE
2015 || TREE_ADDRESSABLE (var)
2016 || (RECORD_OR_UNION_TYPE_P (var_type)
2017 && record_or_union_type_has_array_p (var_type))))
2018 return true;
2020 return false;
2023 /* Check if the current function has calls that use a return slot. */
2025 static bool
2026 stack_protect_return_slot_p ()
2028 basic_block bb;
2030 FOR_ALL_BB_FN (bb, cfun)
2031 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2032 !gsi_end_p (gsi); gsi_next (&gsi))
2034 gimple *stmt = gsi_stmt (gsi);
2035 /* This assumes that calls to internal-only functions never
2036 use a return slot. */
2037 if (is_gimple_call (stmt)
2038 && !gimple_call_internal_p (stmt)
2039 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2040 gimple_call_fndecl (stmt)))
2041 return true;
2043 return false;
2046 /* Expand all variables used in the function. */
2048 static rtx_insn *
2049 expand_used_vars (void)
2051 tree var, outer_block = DECL_INITIAL (current_function_decl);
2052 auto_vec<tree> maybe_local_decls;
2053 rtx_insn *var_end_seq = NULL;
2054 unsigned i;
2055 unsigned len;
2056 bool gen_stack_protect_signal = false;
2058 /* Compute the phase of the stack frame for this function. */
2060 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2061 int off = targetm.starting_frame_offset () % align;
2062 frame_phase = off ? align - off : 0;
2065 /* Set TREE_USED on all variables in the local_decls. */
2066 FOR_EACH_LOCAL_DECL (cfun, i, var)
2067 TREE_USED (var) = 1;
2068 /* Clear TREE_USED on all variables associated with a block scope. */
2069 clear_tree_used (DECL_INITIAL (current_function_decl));
2071 init_vars_expansion ();
2073 if (targetm.use_pseudo_pic_reg ())
2074 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2076 for (i = 0; i < SA.map->num_partitions; i++)
2078 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2079 continue;
2081 tree var = partition_to_var (SA.map, i);
2083 gcc_assert (!virtual_operand_p (var));
2085 expand_one_ssa_partition (var);
2088 if (flag_stack_protect == SPCT_FLAG_STRONG)
2089 gen_stack_protect_signal
2090 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2092 /* At this point all variables on the local_decls with TREE_USED
2093 set are not associated with any block scope. Lay them out. */
2095 len = vec_safe_length (cfun->local_decls);
2096 FOR_EACH_LOCAL_DECL (cfun, i, var)
2098 bool expand_now = false;
2100 /* Expanded above already. */
2101 if (is_gimple_reg (var))
2103 TREE_USED (var) = 0;
2104 goto next;
2106 /* We didn't set a block for static or extern because it's hard
2107 to tell the difference between a global variable (re)declared
2108 in a local scope, and one that's really declared there to
2109 begin with. And it doesn't really matter much, since we're
2110 not giving them stack space. Expand them now. */
2111 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2112 expand_now = true;
2114 /* Expand variables not associated with any block now. Those created by
2115 the optimizers could be live anywhere in the function. Those that
2116 could possibly have been scoped originally and detached from their
2117 block will have their allocation deferred so we coalesce them with
2118 others when optimization is enabled. */
2119 else if (TREE_USED (var))
2120 expand_now = true;
2122 /* Finally, mark all variables on the list as used. We'll use
2123 this in a moment when we expand those associated with scopes. */
2124 TREE_USED (var) = 1;
2126 if (expand_now)
2127 expand_one_var (var, true, true);
2129 next:
2130 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2132 rtx rtl = DECL_RTL_IF_SET (var);
2134 /* Keep artificial non-ignored vars in cfun->local_decls
2135 chain until instantiate_decls. */
2136 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2137 add_local_decl (cfun, var);
2138 else if (rtl == NULL_RTX)
2139 /* If rtl isn't set yet, which can happen e.g. with
2140 -fstack-protector, retry before returning from this
2141 function. */
2142 maybe_local_decls.safe_push (var);
2146 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2148 +-----------------+-----------------+
2149 | ...processed... | ...duplicates...|
2150 +-----------------+-----------------+
2152 +-- LEN points here.
2154 We just want the duplicates, as those are the artificial
2155 non-ignored vars that we want to keep until instantiate_decls.
2156 Move them down and truncate the array. */
2157 if (!vec_safe_is_empty (cfun->local_decls))
2158 cfun->local_decls->block_remove (0, len);
2160 /* At this point, all variables within the block tree with TREE_USED
2161 set are actually used by the optimized function. Lay them out. */
2162 expand_used_vars_for_block (outer_block, true);
2164 if (stack_vars_num > 0)
2166 add_scope_conflicts ();
2168 /* If stack protection is enabled, we don't share space between
2169 vulnerable data and non-vulnerable data. */
2170 if (flag_stack_protect != 0
2171 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2172 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2173 && lookup_attribute ("stack_protect",
2174 DECL_ATTRIBUTES (current_function_decl)))))
2175 add_stack_protection_conflicts ();
2177 /* Now that we have collected all stack variables, and have computed a
2178 minimal interference graph, attempt to save some stack space. */
2179 partition_stack_vars ();
2180 if (dump_file)
2181 dump_stack_var_partition ();
2184 switch (flag_stack_protect)
2186 case SPCT_FLAG_ALL:
2187 create_stack_guard ();
2188 break;
2190 case SPCT_FLAG_STRONG:
2191 if (gen_stack_protect_signal
2192 || cfun->calls_alloca || has_protected_decls
2193 || lookup_attribute ("stack_protect",
2194 DECL_ATTRIBUTES (current_function_decl)))
2195 create_stack_guard ();
2196 break;
2198 case SPCT_FLAG_DEFAULT:
2199 if (cfun->calls_alloca || has_protected_decls
2200 || lookup_attribute ("stack_protect",
2201 DECL_ATTRIBUTES (current_function_decl)))
2202 create_stack_guard ();
2203 break;
2205 case SPCT_FLAG_EXPLICIT:
2206 if (lookup_attribute ("stack_protect",
2207 DECL_ATTRIBUTES (current_function_decl)))
2208 create_stack_guard ();
2209 break;
2210 default:
2214 /* Assign rtl to each variable based on these partitions. */
2215 if (stack_vars_num > 0)
2217 struct stack_vars_data data;
2219 data.asan_base = NULL_RTX;
2220 data.asan_alignb = 0;
2222 /* Reorder decls to be protected by iterating over the variables
2223 array multiple times, and allocating out of each phase in turn. */
2224 /* ??? We could probably integrate this into the qsort we did
2225 earlier, such that we naturally see these variables first,
2226 and thus naturally allocate things in the right order. */
2227 if (has_protected_decls)
2229 /* Phase 1 contains only character arrays. */
2230 expand_stack_vars (stack_protect_decl_phase_1, &data);
2232 /* Phase 2 contains other kinds of arrays. */
2233 if (flag_stack_protect == SPCT_FLAG_ALL
2234 || flag_stack_protect == SPCT_FLAG_STRONG
2235 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2236 && lookup_attribute ("stack_protect",
2237 DECL_ATTRIBUTES (current_function_decl))))
2238 expand_stack_vars (stack_protect_decl_phase_2, &data);
2241 if (asan_sanitize_stack_p ())
2242 /* Phase 3, any partitions that need asan protection
2243 in addition to phase 1 and 2. */
2244 expand_stack_vars (asan_decl_phase_3, &data);
2246 /* ASAN description strings don't yet have a syntax for expressing
2247 polynomial offsets. */
2248 HOST_WIDE_INT prev_offset;
2249 if (!data.asan_vec.is_empty ()
2250 && frame_offset.is_constant (&prev_offset))
2252 HOST_WIDE_INT offset, sz, redzonesz;
2253 redzonesz = ASAN_RED_ZONE_SIZE;
2254 sz = data.asan_vec[0] - prev_offset;
2255 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2256 && data.asan_alignb <= 4096
2257 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2258 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2259 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2260 /* Allocating a constant amount of space from a constant
2261 starting offset must give a constant result. */
2262 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2263 .to_constant ());
2264 data.asan_vec.safe_push (prev_offset);
2265 data.asan_vec.safe_push (offset);
2266 /* Leave space for alignment if STRICT_ALIGNMENT. */
2267 if (STRICT_ALIGNMENT)
2268 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2269 << ASAN_SHADOW_SHIFT)
2270 / BITS_PER_UNIT, 1);
2272 var_end_seq
2273 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2274 data.asan_base,
2275 data.asan_alignb,
2276 data.asan_vec.address (),
2277 data.asan_decl_vec.address (),
2278 data.asan_vec.length ());
2281 expand_stack_vars (NULL, &data);
2284 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2285 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2286 virtual_stack_vars_rtx,
2287 var_end_seq);
2289 fini_vars_expansion ();
2291 /* If there were any artificial non-ignored vars without rtl
2292 found earlier, see if deferred stack allocation hasn't assigned
2293 rtl to them. */
2294 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2296 rtx rtl = DECL_RTL_IF_SET (var);
2298 /* Keep artificial non-ignored vars in cfun->local_decls
2299 chain until instantiate_decls. */
2300 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2301 add_local_decl (cfun, var);
2304 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2305 if (STACK_ALIGNMENT_NEEDED)
2307 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2308 if (FRAME_GROWS_DOWNWARD)
2309 frame_offset = aligned_lower_bound (frame_offset, align);
2310 else
2311 frame_offset = aligned_upper_bound (frame_offset, align);
2314 return var_end_seq;
2318 /* If we need to produce a detailed dump, print the tree representation
2319 for STMT to the dump file. SINCE is the last RTX after which the RTL
2320 generated for STMT should have been appended. */
2322 static void
2323 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2325 if (dump_file && (dump_flags & TDF_DETAILS))
2327 fprintf (dump_file, "\n;; ");
2328 print_gimple_stmt (dump_file, stmt, 0,
2329 TDF_SLIM | (dump_flags & TDF_LINENO));
2330 fprintf (dump_file, "\n");
2332 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2336 /* Maps the blocks that do not contain tree labels to rtx labels. */
2338 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2340 /* Returns the label_rtx expression for a label starting basic block BB. */
2342 static rtx_code_label *
2343 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2345 gimple_stmt_iterator gsi;
2346 tree lab;
2348 if (bb->flags & BB_RTL)
2349 return block_label (bb);
2351 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2352 if (elt)
2353 return *elt;
2355 /* Find the tree label if it is present. */
2357 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2359 glabel *lab_stmt;
2361 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2362 if (!lab_stmt)
2363 break;
2365 lab = gimple_label_label (lab_stmt);
2366 if (DECL_NONLOCAL (lab))
2367 break;
2369 return jump_target_rtx (lab);
2372 rtx_code_label *l = gen_label_rtx ();
2373 lab_rtx_for_bb->put (bb, l);
2374 return l;
2378 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2379 of a basic block where we just expanded the conditional at the end,
2380 possibly clean up the CFG and instruction sequence. LAST is the
2381 last instruction before the just emitted jump sequence. */
2383 static void
2384 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2386 /* Special case: when jumpif decides that the condition is
2387 trivial it emits an unconditional jump (and the necessary
2388 barrier). But we still have two edges, the fallthru one is
2389 wrong. purge_dead_edges would clean this up later. Unfortunately
2390 we have to insert insns (and split edges) before
2391 find_many_sub_basic_blocks and hence before purge_dead_edges.
2392 But splitting edges might create new blocks which depend on the
2393 fact that if there are two edges there's no barrier. So the
2394 barrier would get lost and verify_flow_info would ICE. Instead
2395 of auditing all edge splitters to care for the barrier (which
2396 normally isn't there in a cleaned CFG), fix it here. */
2397 if (BARRIER_P (get_last_insn ()))
2399 rtx_insn *insn;
2400 remove_edge (e);
2401 /* Now, we have a single successor block, if we have insns to
2402 insert on the remaining edge we potentially will insert
2403 it at the end of this block (if the dest block isn't feasible)
2404 in order to avoid splitting the edge. This insertion will take
2405 place in front of the last jump. But we might have emitted
2406 multiple jumps (conditional and one unconditional) to the
2407 same destination. Inserting in front of the last one then
2408 is a problem. See PR 40021. We fix this by deleting all
2409 jumps except the last unconditional one. */
2410 insn = PREV_INSN (get_last_insn ());
2411 /* Make sure we have an unconditional jump. Otherwise we're
2412 confused. */
2413 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2414 for (insn = PREV_INSN (insn); insn != last;)
2416 insn = PREV_INSN (insn);
2417 if (JUMP_P (NEXT_INSN (insn)))
2419 if (!any_condjump_p (NEXT_INSN (insn)))
2421 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2422 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2424 delete_insn (NEXT_INSN (insn));
2430 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2431 Returns a new basic block if we've terminated the current basic
2432 block and created a new one. */
2434 static basic_block
2435 expand_gimple_cond (basic_block bb, gcond *stmt)
2437 basic_block new_bb, dest;
2438 edge true_edge;
2439 edge false_edge;
2440 rtx_insn *last2, *last;
2441 enum tree_code code;
2442 tree op0, op1;
2444 code = gimple_cond_code (stmt);
2445 op0 = gimple_cond_lhs (stmt);
2446 op1 = gimple_cond_rhs (stmt);
2447 /* We're sometimes presented with such code:
2448 D.123_1 = x < y;
2449 if (D.123_1 != 0)
2451 This would expand to two comparisons which then later might
2452 be cleaned up by combine. But some pattern matchers like if-conversion
2453 work better when there's only one compare, so make up for this
2454 here as special exception if TER would have made the same change. */
2455 if (SA.values
2456 && TREE_CODE (op0) == SSA_NAME
2457 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2458 && TREE_CODE (op1) == INTEGER_CST
2459 && ((gimple_cond_code (stmt) == NE_EXPR
2460 && integer_zerop (op1))
2461 || (gimple_cond_code (stmt) == EQ_EXPR
2462 && integer_onep (op1)))
2463 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2465 gimple *second = SSA_NAME_DEF_STMT (op0);
2466 if (gimple_code (second) == GIMPLE_ASSIGN)
2468 enum tree_code code2 = gimple_assign_rhs_code (second);
2469 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2471 code = code2;
2472 op0 = gimple_assign_rhs1 (second);
2473 op1 = gimple_assign_rhs2 (second);
2475 /* If jumps are cheap and the target does not support conditional
2476 compare, turn some more codes into jumpy sequences. */
2477 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2478 && targetm.gen_ccmp_first == NULL)
2480 if ((code2 == BIT_AND_EXPR
2481 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2482 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2483 || code2 == TRUTH_AND_EXPR)
2485 code = TRUTH_ANDIF_EXPR;
2486 op0 = gimple_assign_rhs1 (second);
2487 op1 = gimple_assign_rhs2 (second);
2489 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2491 code = TRUTH_ORIF_EXPR;
2492 op0 = gimple_assign_rhs1 (second);
2493 op1 = gimple_assign_rhs2 (second);
2499 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2500 into (x - C2) * C3 < C4. */
2501 if ((code == EQ_EXPR || code == NE_EXPR)
2502 && TREE_CODE (op0) == SSA_NAME
2503 && TREE_CODE (op1) == INTEGER_CST)
2504 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2506 last2 = last = get_last_insn ();
2508 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2509 set_curr_insn_location (gimple_location (stmt));
2511 /* These flags have no purpose in RTL land. */
2512 true_edge->flags &= ~EDGE_TRUE_VALUE;
2513 false_edge->flags &= ~EDGE_FALSE_VALUE;
2515 /* We can either have a pure conditional jump with one fallthru edge or
2516 two-way jump that needs to be decomposed into two basic blocks. */
2517 if (false_edge->dest == bb->next_bb)
2519 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2520 true_edge->probability);
2521 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2522 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2523 set_curr_insn_location (true_edge->goto_locus);
2524 false_edge->flags |= EDGE_FALLTHRU;
2525 maybe_cleanup_end_of_block (false_edge, last);
2526 return NULL;
2528 if (true_edge->dest == bb->next_bb)
2530 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2531 false_edge->probability);
2532 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2533 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2534 set_curr_insn_location (false_edge->goto_locus);
2535 true_edge->flags |= EDGE_FALLTHRU;
2536 maybe_cleanup_end_of_block (true_edge, last);
2537 return NULL;
2540 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2541 true_edge->probability);
2542 last = get_last_insn ();
2543 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2544 set_curr_insn_location (false_edge->goto_locus);
2545 emit_jump (label_rtx_for_bb (false_edge->dest));
2547 BB_END (bb) = last;
2548 if (BARRIER_P (BB_END (bb)))
2549 BB_END (bb) = PREV_INSN (BB_END (bb));
2550 update_bb_for_insn (bb);
2552 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2553 dest = false_edge->dest;
2554 redirect_edge_succ (false_edge, new_bb);
2555 false_edge->flags |= EDGE_FALLTHRU;
2556 new_bb->count = false_edge->count ();
2557 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2558 add_bb_to_loop (new_bb, loop);
2559 if (loop->latch == bb
2560 && loop->header == dest)
2561 loop->latch = new_bb;
2562 make_single_succ_edge (new_bb, dest, 0);
2563 if (BARRIER_P (BB_END (new_bb)))
2564 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2565 update_bb_for_insn (new_bb);
2567 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2569 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2571 set_curr_insn_location (true_edge->goto_locus);
2572 true_edge->goto_locus = curr_insn_location ();
2575 return new_bb;
2578 /* Mark all calls that can have a transaction restart. */
2580 static void
2581 mark_transaction_restart_calls (gimple *stmt)
2583 struct tm_restart_node dummy;
2584 tm_restart_node **slot;
2586 if (!cfun->gimple_df->tm_restart)
2587 return;
2589 dummy.stmt = stmt;
2590 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2591 if (slot)
2593 struct tm_restart_node *n = *slot;
2594 tree list = n->label_or_list;
2595 rtx_insn *insn;
2597 for (insn = next_real_insn (get_last_insn ());
2598 !CALL_P (insn);
2599 insn = next_real_insn (insn))
2600 continue;
2602 if (TREE_CODE (list) == LABEL_DECL)
2603 add_reg_note (insn, REG_TM, label_rtx (list));
2604 else
2605 for (; list ; list = TREE_CHAIN (list))
2606 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2610 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2611 statement STMT. */
2613 static void
2614 expand_call_stmt (gcall *stmt)
2616 tree exp, decl, lhs;
2617 bool builtin_p;
2618 size_t i;
2620 if (gimple_call_internal_p (stmt))
2622 expand_internal_call (stmt);
2623 return;
2626 /* If this is a call to a built-in function and it has no effect other
2627 than setting the lhs, try to implement it using an internal function
2628 instead. */
2629 decl = gimple_call_fndecl (stmt);
2630 if (gimple_call_lhs (stmt)
2631 && !gimple_has_side_effects (stmt)
2632 && (optimize || (decl && called_as_built_in (decl))))
2634 internal_fn ifn = replacement_internal_fn (stmt);
2635 if (ifn != IFN_LAST)
2637 expand_internal_call (ifn, stmt);
2638 return;
2642 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2644 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2645 builtin_p = decl && fndecl_built_in_p (decl);
2647 /* If this is not a builtin function, the function type through which the
2648 call is made may be different from the type of the function. */
2649 if (!builtin_p)
2650 CALL_EXPR_FN (exp)
2651 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2652 CALL_EXPR_FN (exp));
2654 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2655 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2657 for (i = 0; i < gimple_call_num_args (stmt); i++)
2659 tree arg = gimple_call_arg (stmt, i);
2660 gimple *def;
2661 /* TER addresses into arguments of builtin functions so we have a
2662 chance to infer more correct alignment information. See PR39954. */
2663 if (builtin_p
2664 && TREE_CODE (arg) == SSA_NAME
2665 && (def = get_gimple_for_ssa_name (arg))
2666 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2667 arg = gimple_assign_rhs1 (def);
2668 CALL_EXPR_ARG (exp, i) = arg;
2671 if (gimple_has_side_effects (stmt))
2672 TREE_SIDE_EFFECTS (exp) = 1;
2674 if (gimple_call_nothrow_p (stmt))
2675 TREE_NOTHROW (exp) = 1;
2677 if (gimple_no_warning_p (stmt))
2678 TREE_NO_WARNING (exp) = 1;
2680 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2681 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2682 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2683 if (decl
2684 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2685 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2686 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2687 else
2688 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2689 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2690 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2691 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2693 /* Ensure RTL is created for debug args. */
2694 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2696 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2697 unsigned int ix;
2698 tree dtemp;
2700 if (debug_args)
2701 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2703 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2704 expand_debug_expr (dtemp);
2708 rtx_insn *before_call = get_last_insn ();
2709 lhs = gimple_call_lhs (stmt);
2710 if (lhs)
2711 expand_assignment (lhs, exp, false);
2712 else
2713 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2715 /* If the gimple call is an indirect call and has 'nocf_check'
2716 attribute find a generated CALL insn to mark it as no
2717 control-flow verification is needed. */
2718 if (gimple_call_nocf_check_p (stmt)
2719 && !gimple_call_fndecl (stmt))
2721 rtx_insn *last = get_last_insn ();
2722 while (!CALL_P (last)
2723 && last != before_call)
2724 last = PREV_INSN (last);
2726 if (last != before_call)
2727 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2730 mark_transaction_restart_calls (stmt);
2734 /* Generate RTL for an asm statement (explicit assembler code).
2735 STRING is a STRING_CST node containing the assembler code text,
2736 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2737 insn is volatile; don't optimize it. */
2739 static void
2740 expand_asm_loc (tree string, int vol, location_t locus)
2742 rtx body;
2744 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2745 ggc_strdup (TREE_STRING_POINTER (string)),
2746 locus);
2748 MEM_VOLATILE_P (body) = vol;
2750 /* Non-empty basic ASM implicitly clobbers memory. */
2751 if (TREE_STRING_LENGTH (string) != 0)
2753 rtx asm_op, clob;
2754 unsigned i, nclobbers;
2755 auto_vec<rtx> input_rvec, output_rvec;
2756 auto_vec<const char *> constraints;
2757 auto_vec<rtx> clobber_rvec;
2758 HARD_REG_SET clobbered_regs;
2759 CLEAR_HARD_REG_SET (clobbered_regs);
2761 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2762 clobber_rvec.safe_push (clob);
2764 if (targetm.md_asm_adjust)
2765 targetm.md_asm_adjust (output_rvec, input_rvec,
2766 constraints, clobber_rvec,
2767 clobbered_regs);
2769 asm_op = body;
2770 nclobbers = clobber_rvec.length ();
2771 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2773 XVECEXP (body, 0, 0) = asm_op;
2774 for (i = 0; i < nclobbers; i++)
2775 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2778 emit_insn (body);
/* Count how many characters of the NUL-terminated string S compare
   equal to C and return that count.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;
  for (const char *p = s; *p != '\0'; ++p)
    if (*p == c)
      ++count;
  return count;
}
2791 /* A subroutine of expand_asm_operands. Check that all operands have
2792 the same number of alternatives. Return true if so. */
2794 static bool
2795 check_operand_nalternatives (const vec<const char *> &constraints)
2797 unsigned len = constraints.length();
2798 if (len > 0)
2800 int nalternatives = n_occurrences (',', constraints[0]);
2802 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2804 error ("too many alternatives in %<asm%>");
2805 return false;
2808 for (unsigned i = 1; i < len; ++i)
2809 if (n_occurrences (',', constraints[i]) != nalternatives)
2811 error ("operand constraints for %<asm%> differ "
2812 "in number of alternatives");
2813 return false;
2816 return true;
2819 /* Check for overlap between registers marked in CLOBBERED_REGS and
2820 anything inappropriate in T. Emit error and return the register
2821 variable definition for error, NULL_TREE for ok. */
2823 static bool
2824 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2826 /* Conflicts between asm-declared register variables and the clobber
2827 list are not allowed. */
2828 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2830 if (overlap)
2832 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2833 DECL_NAME (overlap));
2835 /* Reset registerness to stop multiple errors emitted for a single
2836 variable. */
2837 DECL_REGISTER (overlap) = 0;
2838 return true;
2841 return false;
2844 /* Generate RTL for an asm statement with arguments.
2845 STRING is the instruction template.
2846 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2847 Each output or input has an expression in the TREE_VALUE and
2848 a tree list in TREE_PURPOSE which in turn contains a constraint
2849 name in TREE_VALUE (or NULL_TREE) and a constraint string
2850 in TREE_PURPOSE.
2851 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2852 that is clobbered by this insn.
2854 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2855 should be the fallthru basic block of the asm goto.
2857 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2858 Some elements of OUTPUTS may be replaced with trees representing temporary
2859 values. The caller should copy those temporary values to the originally
2860 specified lvalues.
2862 VOL nonzero means the insn is volatile; don't optimize it. */
2864 static void
2865 expand_asm_stmt (gasm *stmt)
2867 class save_input_location
2869 location_t old;
2871 public:
2872 explicit save_input_location(location_t where)
2874 old = input_location;
2875 input_location = where;
2878 ~save_input_location()
2880 input_location = old;
2884 location_t locus = gimple_location (stmt);
2886 if (gimple_asm_input_p (stmt))
2888 const char *s = gimple_asm_string (stmt);
2889 tree string = build_string (strlen (s), s);
2890 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2891 return;
2894 /* There are some legacy diagnostics in here, and this also avoids a
2895 sixth parameter to targetm.md_asm_adjust. */
2896 save_input_location s_i_l(locus);
2898 unsigned noutputs = gimple_asm_noutputs (stmt);
2899 unsigned ninputs = gimple_asm_ninputs (stmt);
2900 unsigned nlabels = gimple_asm_nlabels (stmt);
2901 unsigned i;
2903 /* ??? Diagnose during gimplification? */
2904 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2906 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2907 return;
2910 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2911 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2912 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2914 /* Copy the gimple vectors into new vectors that we can manipulate. */
2916 output_tvec.safe_grow (noutputs);
2917 input_tvec.safe_grow (ninputs);
2918 constraints.safe_grow (noutputs + ninputs);
2920 for (i = 0; i < noutputs; ++i)
2922 tree t = gimple_asm_output_op (stmt, i);
2923 output_tvec[i] = TREE_VALUE (t);
2924 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2926 for (i = 0; i < ninputs; i++)
2928 tree t = gimple_asm_input_op (stmt, i);
2929 input_tvec[i] = TREE_VALUE (t);
2930 constraints[i + noutputs]
2931 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2934 /* ??? Diagnose during gimplification? */
2935 if (! check_operand_nalternatives (constraints))
2936 return;
2938 /* Count the number of meaningful clobbered registers, ignoring what
2939 we would ignore later. */
2940 auto_vec<rtx> clobber_rvec;
2941 HARD_REG_SET clobbered_regs;
2942 CLEAR_HARD_REG_SET (clobbered_regs);
2944 if (unsigned n = gimple_asm_nclobbers (stmt))
2946 clobber_rvec.reserve (n);
2947 for (i = 0; i < n; i++)
2949 tree t = gimple_asm_clobber_op (stmt, i);
2950 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2951 int nregs, j;
2953 j = decode_reg_name_and_count (regname, &nregs);
2954 if (j < 0)
2956 if (j == -2)
2958 /* ??? Diagnose during gimplification? */
2959 error ("unknown register name %qs in %<asm%>", regname);
2961 else if (j == -4)
2963 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2964 clobber_rvec.safe_push (x);
2966 else
2968 /* Otherwise we should have -1 == empty string
2969 or -3 == cc, which is not a register. */
2970 gcc_assert (j == -1 || j == -3);
2973 else
2974 for (int reg = j; reg < j + nregs; reg++)
2976 /* Clobbering the PIC register is an error. */
2977 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2979 /* ??? Diagnose during gimplification? */
2980 error ("PIC register clobbered by %qs in %<asm%>",
2981 regname);
2982 return;
2985 SET_HARD_REG_BIT (clobbered_regs, reg);
2986 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2987 clobber_rvec.safe_push (x);
2991 unsigned nclobbers = clobber_rvec.length();
2993 /* First pass over inputs and outputs checks validity and sets
2994 mark_addressable if needed. */
2995 /* ??? Diagnose during gimplification? */
2997 for (i = 0; i < noutputs; ++i)
2999 tree val = output_tvec[i];
3000 tree type = TREE_TYPE (val);
3001 const char *constraint;
3002 bool is_inout;
3003 bool allows_reg;
3004 bool allows_mem;
3006 /* Try to parse the output constraint. If that fails, there's
3007 no point in going further. */
3008 constraint = constraints[i];
3009 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3010 &allows_mem, &allows_reg, &is_inout))
3011 return;
3013 if (! allows_reg
3014 && (allows_mem
3015 || is_inout
3016 || (DECL_P (val)
3017 && REG_P (DECL_RTL (val))
3018 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3019 mark_addressable (val);
3022 for (i = 0; i < ninputs; ++i)
3024 bool allows_reg, allows_mem;
3025 const char *constraint;
3027 constraint = constraints[i + noutputs];
3028 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3029 constraints.address (),
3030 &allows_mem, &allows_reg))
3031 return;
3033 if (! allows_reg && allows_mem)
3034 mark_addressable (input_tvec[i]);
3037 /* Second pass evaluates arguments. */
3039 /* Make sure stack is consistent for asm goto. */
3040 if (nlabels > 0)
3041 do_pending_stack_adjust ();
3042 int old_generating_concat_p = generating_concat_p;
3044 /* Vector of RTX's of evaluated output operands. */
3045 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3046 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3047 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3049 output_rvec.safe_grow (noutputs);
3051 for (i = 0; i < noutputs; ++i)
3053 tree val = output_tvec[i];
3054 tree type = TREE_TYPE (val);
3055 bool is_inout, allows_reg, allows_mem, ok;
3056 rtx op;
3058 ok = parse_output_constraint (&constraints[i], i, ninputs,
3059 noutputs, &allows_mem, &allows_reg,
3060 &is_inout);
3061 gcc_assert (ok);
3063 /* If an output operand is not a decl or indirect ref and our constraint
3064 allows a register, make a temporary to act as an intermediate.
3065 Make the asm insn write into that, then we will copy it to
3066 the real output operand. Likewise for promoted variables. */
3068 generating_concat_p = 0;
3070 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3071 || (DECL_P (val)
3072 && (allows_mem || REG_P (DECL_RTL (val)))
3073 && ! (REG_P (DECL_RTL (val))
3074 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3075 || ! allows_reg
3076 || is_inout
3077 || TREE_ADDRESSABLE (type))
3079 op = expand_expr (val, NULL_RTX, VOIDmode,
3080 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3081 if (MEM_P (op))
3082 op = validize_mem (op);
3084 if (! allows_reg && !MEM_P (op))
3085 error ("output number %d not directly addressable", i);
3086 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3087 || GET_CODE (op) == CONCAT)
3089 rtx old_op = op;
3090 op = gen_reg_rtx (GET_MODE (op));
3092 generating_concat_p = old_generating_concat_p;
3094 if (is_inout)
3095 emit_move_insn (op, old_op);
3097 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3098 emit_move_insn (old_op, op);
3099 after_rtl_seq = get_insns ();
3100 after_rtl_end = get_last_insn ();
3101 end_sequence ();
3104 else
3106 op = assign_temp (type, 0, 1);
3107 op = validize_mem (op);
3108 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3109 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3111 generating_concat_p = old_generating_concat_p;
3113 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3114 expand_assignment (val, make_tree (type, op), false);
3115 after_rtl_seq = get_insns ();
3116 after_rtl_end = get_last_insn ();
3117 end_sequence ();
3119 output_rvec[i] = op;
3121 if (is_inout)
3122 inout_opnum.safe_push (i);
3125 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3126 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3128 input_rvec.safe_grow (ninputs);
3129 input_mode.safe_grow (ninputs);
3131 generating_concat_p = 0;
3133 for (i = 0; i < ninputs; ++i)
3135 tree val = input_tvec[i];
3136 tree type = TREE_TYPE (val);
3137 bool allows_reg, allows_mem, ok;
3138 const char *constraint;
3139 rtx op;
3141 constraint = constraints[i + noutputs];
3142 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3143 constraints.address (),
3144 &allows_mem, &allows_reg);
3145 gcc_assert (ok);
3147 /* EXPAND_INITIALIZER will not generate code for valid initializer
3148 constants, but will still generate code for other types of operand.
3149 This is the behavior we want for constant constraints. */
3150 op = expand_expr (val, NULL_RTX, VOIDmode,
3151 allows_reg ? EXPAND_NORMAL
3152 : allows_mem ? EXPAND_MEMORY
3153 : EXPAND_INITIALIZER);
3155 /* Never pass a CONCAT to an ASM. */
3156 if (GET_CODE (op) == CONCAT)
3157 op = force_reg (GET_MODE (op), op);
3158 else if (MEM_P (op))
3159 op = validize_mem (op);
3161 if (asm_operand_ok (op, constraint, NULL) <= 0)
3163 if (allows_reg && TYPE_MODE (type) != BLKmode)
3164 op = force_reg (TYPE_MODE (type), op);
3165 else if (!allows_mem)
3166 warning (0, "asm operand %d probably doesn%'t match constraints",
3167 i + noutputs);
3168 else if (MEM_P (op))
3170 /* We won't recognize either volatile memory or memory
3171 with a queued address as available a memory_operand
3172 at this point. Ignore it: clearly this *is* a memory. */
3174 else
3175 gcc_unreachable ();
3177 input_rvec[i] = op;
3178 input_mode[i] = TYPE_MODE (type);
3181 /* For in-out operands, copy output rtx to input rtx. */
3182 unsigned ninout = inout_opnum.length();
3183 for (i = 0; i < ninout; i++)
3185 int j = inout_opnum[i];
3186 rtx o = output_rvec[j];
3188 input_rvec.safe_push (o);
3189 input_mode.safe_push (GET_MODE (o));
3191 char buffer[16];
3192 sprintf (buffer, "%d", j);
3193 constraints.safe_push (ggc_strdup (buffer));
3195 ninputs += ninout;
3197 /* Sometimes we wish to automatically clobber registers across an asm.
3198 Case in point is when the i386 backend moved from cc0 to a hard reg --
3199 maintaining source-level compatibility means automatically clobbering
3200 the flags register. */
3201 rtx_insn *after_md_seq = NULL;
3202 if (targetm.md_asm_adjust)
3203 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3204 constraints, clobber_rvec,
3205 clobbered_regs);
3207 /* Do not allow the hook to change the output and input count,
3208 lest it mess up the operand numbering. */
3209 gcc_assert (output_rvec.length() == noutputs);
3210 gcc_assert (input_rvec.length() == ninputs);
3211 gcc_assert (constraints.length() == noutputs + ninputs);
3213 /* But it certainly can adjust the clobbers. */
3214 nclobbers = clobber_rvec.length();
3216 /* Third pass checks for easy conflicts. */
3217 /* ??? Why are we doing this on trees instead of rtx. */
3219 bool clobber_conflict_found = 0;
3220 for (i = 0; i < noutputs; ++i)
3221 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3222 clobber_conflict_found = 1;
3223 for (i = 0; i < ninputs - ninout; ++i)
3224 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3225 clobber_conflict_found = 1;
3227 /* Make vectors for the expression-rtx, constraint strings,
3228 and named operands. */
3230 rtvec argvec = rtvec_alloc (ninputs);
3231 rtvec constraintvec = rtvec_alloc (ninputs);
3232 rtvec labelvec = rtvec_alloc (nlabels);
3234 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3235 : GET_MODE (output_rvec[0])),
3236 ggc_strdup (gimple_asm_string (stmt)),
3237 "", 0, argvec, constraintvec,
3238 labelvec, locus);
3239 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3241 for (i = 0; i < ninputs; ++i)
3243 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3244 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3245 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3246 constraints[i + noutputs],
3247 locus);
3250 /* Copy labels to the vector. */
3251 rtx_code_label *fallthru_label = NULL;
3252 if (nlabels > 0)
3254 basic_block fallthru_bb = NULL;
3255 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3256 if (fallthru)
3257 fallthru_bb = fallthru->dest;
3259 for (i = 0; i < nlabels; ++i)
3261 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3262 rtx_insn *r;
3263 /* If asm goto has any labels in the fallthru basic block, use
3264 a label that we emit immediately after the asm goto. Expansion
3265 may insert further instructions into the same basic block after
3266 asm goto and if we don't do this, insertion of instructions on
3267 the fallthru edge might misbehave. See PR58670. */
3268 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3270 if (fallthru_label == NULL_RTX)
3271 fallthru_label = gen_label_rtx ();
3272 r = fallthru_label;
3274 else
3275 r = label_rtx (label);
3276 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3280 /* Now, for each output, construct an rtx
3281 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3282 ARGVEC CONSTRAINTS OPNAMES))
3283 If there is more than one, put them inside a PARALLEL. */
3285 if (nlabels > 0 && nclobbers == 0)
3287 gcc_assert (noutputs == 0);
3288 emit_jump_insn (body);
3290 else if (noutputs == 0 && nclobbers == 0)
3292 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3293 emit_insn (body);
3295 else if (noutputs == 1 && nclobbers == 0)
3297 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3298 emit_insn (gen_rtx_SET (output_rvec[0], body));
3300 else
3302 rtx obody = body;
3303 int num = noutputs;
3305 if (num == 0)
3306 num = 1;
3308 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3310 /* For each output operand, store a SET. */
3311 for (i = 0; i < noutputs; ++i)
3313 rtx src, o = output_rvec[i];
3314 if (i == 0)
3316 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3317 src = obody;
3319 else
3321 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3322 ASM_OPERANDS_TEMPLATE (obody),
3323 constraints[i], i, argvec,
3324 constraintvec, labelvec, locus);
3325 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3327 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3330 /* If there are no outputs (but there are some clobbers)
3331 store the bare ASM_OPERANDS into the PARALLEL. */
3332 if (i == 0)
3333 XVECEXP (body, 0, i++) = obody;
3335 /* Store (clobber REG) for each clobbered register specified. */
3336 for (unsigned j = 0; j < nclobbers; ++j)
3338 rtx clobbered_reg = clobber_rvec[j];
3340 /* Do sanity check for overlap between clobbers and respectively
3341 input and outputs that hasn't been handled. Such overlap
3342 should have been detected and reported above. */
3343 if (!clobber_conflict_found && REG_P (clobbered_reg))
3345 /* We test the old body (obody) contents to avoid
3346 tripping over the under-construction body. */
3347 for (unsigned k = 0; k < noutputs; ++k)
3348 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3349 internal_error ("asm clobber conflict with output operand");
3351 for (unsigned k = 0; k < ninputs - ninout; ++k)
3352 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3353 internal_error ("asm clobber conflict with input operand");
3356 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3359 if (nlabels > 0)
3360 emit_jump_insn (body);
3361 else
3362 emit_insn (body);
3365 generating_concat_p = old_generating_concat_p;
3367 if (fallthru_label)
3368 emit_label (fallthru_label);
3370 if (after_md_seq)
3371 emit_insn (after_md_seq);
3372 if (after_rtl_seq)
3373 emit_insn (after_rtl_seq);
3375 free_temp_slots ();
3376 crtl->has_asm_statement = 1;
3379 /* Emit code to jump to the address
3380 specified by the pointer expression EXP. */
3382 static void
3383 expand_computed_goto (tree exp)
3385 rtx x = expand_normal (exp);
3387 do_pending_stack_adjust ();
3388 emit_indirect_jump (x);
3391 /* Generate RTL code for a `goto' statement with target label LABEL.
3392 LABEL should be a LABEL_DECL tree node that was or will later be
3393 defined with `expand_label'. */
3395 static void
3396 expand_goto (tree label)
3398 if (flag_checking)
3400 /* Check for a nonlocal goto to a containing function. Should have
3401 gotten translated to __builtin_nonlocal_goto. */
3402 tree context = decl_function_context (label);
3403 gcc_assert (!context || context == current_function_decl);
3406 emit_jump (jump_target_rtx (label));
3409 /* Output a return with no value. */
3411 static void
3412 expand_null_return_1 (void)
3414 clear_pending_stack_adjust ();
3415 do_pending_stack_adjust ();
3416 emit_jump (return_label);
3419 /* Generate RTL to return from the current function, with no value.
3420 (That is, we do not do anything about returning any value.) */
3422 void
3423 expand_null_return (void)
3425 /* If this function was declared to return a value, but we
3426 didn't, clobber the return registers so that they are not
3427 propagated live to the rest of the function. */
3428 clobber_return_register ();
3430 expand_null_return_1 ();
3433 /* Generate RTL to return from the current function, with value VAL. */
3435 static void
3436 expand_value_return (rtx val)
3438 /* Copy the value to the return location unless it's already there. */
3440 tree decl = DECL_RESULT (current_function_decl);
3441 rtx return_reg = DECL_RTL (decl);
3442 if (return_reg != val)
3444 tree funtype = TREE_TYPE (current_function_decl);
3445 tree type = TREE_TYPE (decl);
3446 int unsignedp = TYPE_UNSIGNED (type);
3447 machine_mode old_mode = DECL_MODE (decl);
3448 machine_mode mode;
3449 if (DECL_BY_REFERENCE (decl))
3450 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3451 else
3452 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3454 if (mode != old_mode)
3455 val = convert_modes (mode, old_mode, val, unsignedp);
3457 if (GET_CODE (return_reg) == PARALLEL)
3458 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3459 else
3460 emit_move_insn (return_reg, val);
3463 expand_null_return_1 ();
3466 /* Generate RTL to evaluate the expression RETVAL and return it
3467 from the current function. */
3469 static void
3470 expand_return (tree retval)
3472 rtx result_rtl;
3473 rtx val = 0;
3474 tree retval_rhs;
3476 /* If function wants no value, give it none. */
3477 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3479 expand_normal (retval);
3480 expand_null_return ();
3481 return;
3484 if (retval == error_mark_node)
3486 /* Treat this like a return of no value from a function that
3487 returns a value. */
3488 expand_null_return ();
3489 return;
3491 else if ((TREE_CODE (retval) == MODIFY_EXPR
3492 || TREE_CODE (retval) == INIT_EXPR)
3493 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3494 retval_rhs = TREE_OPERAND (retval, 1);
3495 else
3496 retval_rhs = retval;
3498 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3500 /* If we are returning the RESULT_DECL, then the value has already
3501 been stored into it, so we don't have to do anything special. */
3502 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3503 expand_value_return (result_rtl);
3505 /* If the result is an aggregate that is being returned in one (or more)
3506 registers, load the registers here. */
3508 else if (retval_rhs != 0
3509 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3510 && REG_P (result_rtl))
3512 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3513 if (val)
3515 /* Use the mode of the result value on the return register. */
3516 PUT_MODE (result_rtl, GET_MODE (val));
3517 expand_value_return (val);
3519 else
3520 expand_null_return ();
3522 else if (retval_rhs != 0
3523 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3524 && (REG_P (result_rtl)
3525 || (GET_CODE (result_rtl) == PARALLEL)))
3527 /* Compute the return value into a temporary (usually a pseudo reg). */
3529 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3530 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3531 val = force_not_mem (val);
3532 expand_value_return (val);
3534 else
3536 /* No hard reg used; calculate value into hard return reg. */
3537 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3538 expand_value_return (result_rtl);
3542 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3543 register, tell the rtl optimizers that its value is no longer
3544 needed. */
3546 static void
3547 expand_clobber (tree lhs)
3549 if (DECL_P (lhs))
3551 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3552 if (decl_rtl && REG_P (decl_rtl))
3554 machine_mode decl_mode = GET_MODE (decl_rtl);
3555 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3556 REGMODE_NATURAL_SIZE (decl_mode)))
3557 emit_clobber (decl_rtl);
3562 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3563 STMT that doesn't require special handling for outgoing edges. That
3564 is no tailcalls and no GIMPLE_COND. */
3566 static void
3567 expand_gimple_stmt_1 (gimple *stmt)
3569 tree op0;
3571 set_curr_insn_location (gimple_location (stmt));
3573 switch (gimple_code (stmt))
3575 case GIMPLE_GOTO:
3576 op0 = gimple_goto_dest (stmt);
3577 if (TREE_CODE (op0) == LABEL_DECL)
3578 expand_goto (op0);
3579 else
3580 expand_computed_goto (op0);
3581 break;
3582 case GIMPLE_LABEL:
3583 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3584 break;
3585 case GIMPLE_NOP:
3586 case GIMPLE_PREDICT:
3587 break;
3588 case GIMPLE_SWITCH:
3590 gswitch *swtch = as_a <gswitch *> (stmt);
3591 if (gimple_switch_num_labels (swtch) == 1)
3592 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3593 else
3594 expand_case (swtch);
3596 break;
3597 case GIMPLE_ASM:
3598 expand_asm_stmt (as_a <gasm *> (stmt));
3599 break;
3600 case GIMPLE_CALL:
3601 expand_call_stmt (as_a <gcall *> (stmt));
3602 break;
3604 case GIMPLE_RETURN:
3606 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3608 if (op0 && op0 != error_mark_node)
3610 tree result = DECL_RESULT (current_function_decl);
3612 /* If we are not returning the current function's RESULT_DECL,
3613 build an assignment to it. */
3614 if (op0 != result)
3616 /* I believe that a function's RESULT_DECL is unique. */
3617 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3619 /* ??? We'd like to use simply expand_assignment here,
3620 but this fails if the value is of BLKmode but the return
3621 decl is a register. expand_return has special handling
3622 for this combination, which eventually should move
3623 to common code. See comments there. Until then, let's
3624 build a modify expression :-/ */
3625 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3626 result, op0);
3630 if (!op0)
3631 expand_null_return ();
3632 else
3633 expand_return (op0);
3635 break;
3637 case GIMPLE_ASSIGN:
3639 gassign *assign_stmt = as_a <gassign *> (stmt);
3640 tree lhs = gimple_assign_lhs (assign_stmt);
3642 /* Tree expand used to fiddle with |= and &= of two bitfield
3643 COMPONENT_REFs here. This can't happen with gimple, the LHS
3644 of binary assigns must be a gimple reg. */
3646 if (TREE_CODE (lhs) != SSA_NAME
3647 || get_gimple_rhs_class (gimple_expr_code (stmt))
3648 == GIMPLE_SINGLE_RHS)
3650 tree rhs = gimple_assign_rhs1 (assign_stmt);
3651 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3652 == GIMPLE_SINGLE_RHS);
3653 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3654 /* Do not put locations on possibly shared trees. */
3655 && !is_gimple_min_invariant (rhs))
3656 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3657 if (TREE_CLOBBER_P (rhs))
3658 /* This is a clobber to mark the going out of scope for
3659 this LHS. */
3660 expand_clobber (lhs);
3661 else
3662 expand_assignment (lhs, rhs,
3663 gimple_assign_nontemporal_move_p (
3664 assign_stmt));
3666 else
3668 rtx target, temp;
3669 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3670 struct separate_ops ops;
3671 bool promoted = false;
3673 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3674 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3675 promoted = true;
3677 ops.code = gimple_assign_rhs_code (assign_stmt);
3678 ops.type = TREE_TYPE (lhs);
3679 switch (get_gimple_rhs_class (ops.code))
3681 case GIMPLE_TERNARY_RHS:
3682 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3683 /* Fallthru */
3684 case GIMPLE_BINARY_RHS:
3685 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3686 /* Fallthru */
3687 case GIMPLE_UNARY_RHS:
3688 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3689 break;
3690 default:
3691 gcc_unreachable ();
3693 ops.location = gimple_location (stmt);
3695 /* If we want to use a nontemporal store, force the value to
3696 register first. If we store into a promoted register,
3697 don't directly expand to target. */
3698 temp = nontemporal || promoted ? NULL_RTX : target;
3699 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3700 EXPAND_NORMAL);
3702 if (temp == target)
3704 else if (promoted)
3706 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3707 /* If TEMP is a VOIDmode constant, use convert_modes to make
3708 sure that we properly convert it. */
3709 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3711 temp = convert_modes (GET_MODE (target),
3712 TYPE_MODE (ops.type),
3713 temp, unsignedp);
3714 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3715 GET_MODE (target), temp, unsignedp);
3718 convert_move (SUBREG_REG (target), temp, unsignedp);
3720 else if (nontemporal && emit_storent_insn (target, temp))
3722 else
3724 temp = force_operand (temp, target);
3725 if (temp != target)
3726 emit_move_insn (target, temp);
3730 break;
3732 default:
3733 gcc_unreachable ();
3737 /* Expand one gimple statement STMT and return the last RTL instruction
3738 before any of the newly generated ones.
3740 In addition to generating the necessary RTL instructions this also
3741 sets REG_EH_REGION notes if necessary and sets the current source
3742 location for diagnostics. */
3744 static rtx_insn *
3745 expand_gimple_stmt (gimple *stmt)
3747 location_t saved_location = input_location;
3748 rtx_insn *last = get_last_insn ();
3749 int lp_nr;
3751 gcc_assert (cfun);
3753 /* We need to save and restore the current source location so that errors
3754 discovered during expansion are emitted with the right location. But
3755 it would be better if the diagnostic routines used the source location
3756 embedded in the tree nodes rather than globals. */
3757 if (gimple_has_location (stmt))
3758 input_location = gimple_location (stmt);
3760 expand_gimple_stmt_1 (stmt);
3762 /* Free any temporaries used to evaluate this statement. */
3763 free_temp_slots ();
3765 input_location = saved_location;
3767 /* Mark all insns that may trap. */
3768 lp_nr = lookup_stmt_eh_lp (stmt);
3769 if (lp_nr)
3771 rtx_insn *insn;
3772 for (insn = next_real_insn (last); insn;
3773 insn = next_real_insn (insn))
3775 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3776 /* If we want exceptions for non-call insns, any
3777 may_trap_p instruction may throw. */
3778 && GET_CODE (PATTERN (insn)) != CLOBBER
3779 && GET_CODE (PATTERN (insn)) != CLOBBER_HIGH
3780 && GET_CODE (PATTERN (insn)) != USE
3781 && insn_could_throw_p (insn))
3782 make_reg_eh_region_note (insn, 0, lp_nr);
3786 return last;
3789 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3790 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3791 generated a tail call (something that might be denied by the ABI
3792 rules governing the call; see calls.c).
3794 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3795 can still reach the rest of BB. The case here is __builtin_sqrt,
3796 where the NaN result goes through the external function (with a
3797 tailcall) and the normal result happens via a sqrt instruction. */
3799 static basic_block
3800 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3802 rtx_insn *last2, *last;
3803 edge e;
3804 edge_iterator ei;
3805 profile_probability probability;
3807 last2 = last = expand_gimple_stmt (stmt);
3809 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3810 if (CALL_P (last) && SIBLING_CALL_P (last))
3811 goto found;
3813 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3815 *can_fallthru = true;
3816 return NULL;
3818 found:
3819 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3820 Any instructions emitted here are about to be deleted. */
3821 do_pending_stack_adjust ();
3823 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3824 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3825 EH or abnormal edges, we shouldn't have created a tail call in
3826 the first place. So it seems to me we should just be removing
3827 all edges here, or redirecting the existing fallthru edge to
3828 the exit block. */
3830 probability = profile_probability::never ();
3832 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3834 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3836 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3837 e->dest->count -= e->count ();
3838 probability += e->probability;
3839 remove_edge (e);
3841 else
3842 ei_next (&ei);
3845 /* This is somewhat ugly: the call_expr expander often emits instructions
3846 after the sibcall (to perform the function return). These confuse the
3847 find_many_sub_basic_blocks code, so we need to get rid of these. */
3848 last = NEXT_INSN (last);
3849 gcc_assert (BARRIER_P (last));
3851 *can_fallthru = false;
3852 while (NEXT_INSN (last))
3854 /* For instance an sqrt builtin expander expands if with
3855 sibcall in the then and label for `else`. */
3856 if (LABEL_P (NEXT_INSN (last)))
3858 *can_fallthru = true;
3859 break;
3861 delete_insn (NEXT_INSN (last));
3864 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3865 | EDGE_SIBCALL);
3866 e->probability = probability;
3867 BB_END (bb) = last;
3868 update_bb_for_insn (bb);
3870 if (NEXT_INSN (last))
3872 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3874 last = BB_END (bb);
3875 if (BARRIER_P (last))
3876 BB_END (bb) = PREV_INSN (last);
3879 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3881 return bb;
3884 /* Return the difference between the floor and the truncated result of
3885 a signed division by OP1 with remainder MOD. */
3886 static rtx
3887 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3889 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3890 return gen_rtx_IF_THEN_ELSE
3891 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3892 gen_rtx_IF_THEN_ELSE
3893 (mode, gen_rtx_LT (BImode,
3894 gen_rtx_DIV (mode, op1, mod),
3895 const0_rtx),
3896 constm1_rtx, const0_rtx),
3897 const0_rtx);
3900 /* Return the difference between the ceil and the truncated result of
3901 a signed division by OP1 with remainder MOD. */
3902 static rtx
3903 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3905 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3906 return gen_rtx_IF_THEN_ELSE
3907 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3908 gen_rtx_IF_THEN_ELSE
3909 (mode, gen_rtx_GT (BImode,
3910 gen_rtx_DIV (mode, op1, mod),
3911 const0_rtx),
3912 const1_rtx, const0_rtx),
3913 const0_rtx);
3916 /* Return the difference between the ceil and the truncated result of
3917 an unsigned division by OP1 with remainder MOD. */
3918 static rtx
3919 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3921 /* (mod != 0 ? 1 : 0) */
3922 return gen_rtx_IF_THEN_ELSE
3923 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3924 const1_rtx, const0_rtx);
3927 /* Return the difference between the rounded and the truncated result
3928 of a signed division by OP1 with remainder MOD. Halfway cases are
3929 rounded away from zero, rather than to the nearest even number. */
3930 static rtx
3931 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3933 /* (abs (mod) >= abs (op1) - abs (mod)
3934 ? (op1 / mod > 0 ? 1 : -1)
3935 : 0) */
3936 return gen_rtx_IF_THEN_ELSE
3937 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3938 gen_rtx_MINUS (mode,
3939 gen_rtx_ABS (mode, op1),
3940 gen_rtx_ABS (mode, mod))),
3941 gen_rtx_IF_THEN_ELSE
3942 (mode, gen_rtx_GT (BImode,
3943 gen_rtx_DIV (mode, op1, mod),
3944 const0_rtx),
3945 const1_rtx, constm1_rtx),
3946 const0_rtx);
3949 /* Return the difference between the rounded and the truncated result
3950 of a unsigned division by OP1 with remainder MOD. Halfway cases
3951 are rounded away from zero, rather than to the nearest even
3952 number. */
3953 static rtx
3954 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
3956 /* (mod >= op1 - mod ? 1 : 0) */
3957 return gen_rtx_IF_THEN_ELSE
3958 (mode, gen_rtx_GE (BImode, mod,
3959 gen_rtx_MINUS (mode, op1, mod)),
3960 const1_rtx, const0_rtx);
3963 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3964 any rtl. */
3966 static rtx
3967 convert_debug_memory_address (scalar_int_mode mode, rtx x,
3968 addr_space_t as)
3970 #ifndef POINTERS_EXTEND_UNSIGNED
3971 gcc_assert (mode == Pmode
3972 || mode == targetm.addr_space.address_mode (as));
3973 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
3974 #else
3975 rtx temp;
3977 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
3979 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3980 return x;
3982 /* X must have some form of address mode already. */
3983 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
3984 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3985 x = lowpart_subreg (mode, x, xmode);
3986 else if (POINTERS_EXTEND_UNSIGNED > 0)
3987 x = gen_rtx_ZERO_EXTEND (mode, x);
3988 else if (!POINTERS_EXTEND_UNSIGNED)
3989 x = gen_rtx_SIGN_EXTEND (mode, x);
3990 else
3992 switch (GET_CODE (x))
3994 case SUBREG:
3995 if ((SUBREG_PROMOTED_VAR_P (x)
3996 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3997 || (GET_CODE (SUBREG_REG (x)) == PLUS
3998 && REG_P (XEXP (SUBREG_REG (x), 0))
3999 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4000 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4001 && GET_MODE (SUBREG_REG (x)) == mode)
4002 return SUBREG_REG (x);
4003 break;
4004 case LABEL_REF:
4005 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4006 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4007 return temp;
4008 case SYMBOL_REF:
4009 temp = shallow_copy_rtx (x);
4010 PUT_MODE (temp, mode);
4011 return temp;
4012 case CONST:
4013 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4014 if (temp)
4015 temp = gen_rtx_CONST (mode, temp);
4016 return temp;
4017 case PLUS:
4018 case MINUS:
4019 if (CONST_INT_P (XEXP (x, 1)))
4021 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4022 if (temp)
4023 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4025 break;
4026 default:
4027 break;
4029 /* Don't know how to express ptr_extend as operation in debug info. */
4030 return NULL;
4032 #endif /* POINTERS_EXTEND_UNSIGNED */
4034 return x;
4037 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4038 by avoid_deep_ter_for_debug. */
4040 static hash_map<tree, tree> *deep_ter_debug_map;
4042 /* Split too deep TER chains for debug stmts using debug temporaries. */
4044 static void
4045 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4047 use_operand_p use_p;
4048 ssa_op_iter iter;
4049 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4051 tree use = USE_FROM_PTR (use_p);
4052 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4053 continue;
4054 gimple *g = get_gimple_for_ssa_name (use);
4055 if (g == NULL)
4056 continue;
4057 if (depth > 6 && !stmt_ends_bb_p (g))
4059 if (deep_ter_debug_map == NULL)
4060 deep_ter_debug_map = new hash_map<tree, tree>;
4062 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4063 if (vexpr != NULL)
4064 continue;
4065 vexpr = make_node (DEBUG_EXPR_DECL);
4066 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4067 DECL_ARTIFICIAL (vexpr) = 1;
4068 TREE_TYPE (vexpr) = TREE_TYPE (use);
4069 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4070 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4071 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4072 avoid_deep_ter_for_debug (def_temp, 0);
4074 else
4075 avoid_deep_ter_for_debug (g, depth + 1);
4079 /* Return an RTX equivalent to the value of the parameter DECL. */
4081 static rtx
4082 expand_debug_parm_decl (tree decl)
4084 rtx incoming = DECL_INCOMING_RTL (decl);
4086 if (incoming
4087 && GET_MODE (incoming) != BLKmode
4088 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4089 || (MEM_P (incoming)
4090 && REG_P (XEXP (incoming, 0))
4091 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4093 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4095 #ifdef HAVE_window_save
4096 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4097 If the target machine has an explicit window save instruction, the
4098 actual entry value is the corresponding OUTGOING_REGNO instead. */
4099 if (REG_P (incoming)
4100 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4101 incoming
4102 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4103 OUTGOING_REGNO (REGNO (incoming)), 0);
4104 else if (MEM_P (incoming))
4106 rtx reg = XEXP (incoming, 0);
4107 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4109 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4110 incoming = replace_equiv_address_nv (incoming, reg);
4112 else
4113 incoming = copy_rtx (incoming);
4115 #endif
4117 ENTRY_VALUE_EXP (rtl) = incoming;
4118 return rtl;
4121 if (incoming
4122 && GET_MODE (incoming) != BLKmode
4123 && !TREE_ADDRESSABLE (decl)
4124 && MEM_P (incoming)
4125 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4126 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4127 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4128 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4129 return copy_rtx (incoming);
4131 return NULL_RTX;
4134 /* Return an RTX equivalent to the value of the tree expression EXP. */
4136 static rtx
4137 expand_debug_expr (tree exp)
4139 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4140 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4141 machine_mode inner_mode = VOIDmode;
4142 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4143 addr_space_t as;
4144 scalar_int_mode op0_mode, op1_mode, addr_mode;
4146 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4148 case tcc_expression:
4149 switch (TREE_CODE (exp))
4151 case COND_EXPR:
4152 case DOT_PROD_EXPR:
4153 case SAD_EXPR:
4154 case WIDEN_MULT_PLUS_EXPR:
4155 case WIDEN_MULT_MINUS_EXPR:
4156 goto ternary;
4158 case TRUTH_ANDIF_EXPR:
4159 case TRUTH_ORIF_EXPR:
4160 case TRUTH_AND_EXPR:
4161 case TRUTH_OR_EXPR:
4162 case TRUTH_XOR_EXPR:
4163 goto binary;
4165 case TRUTH_NOT_EXPR:
4166 goto unary;
4168 default:
4169 break;
4171 break;
4173 ternary:
4174 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4175 if (!op2)
4176 return NULL_RTX;
4177 /* Fall through. */
4179 binary:
4180 case tcc_binary:
4181 if (mode == BLKmode)
4182 return NULL_RTX;
4183 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4184 if (!op1)
4185 return NULL_RTX;
4186 switch (TREE_CODE (exp))
4188 case LSHIFT_EXPR:
4189 case RSHIFT_EXPR:
4190 case LROTATE_EXPR:
4191 case RROTATE_EXPR:
4192 case WIDEN_LSHIFT_EXPR:
4193 /* Ensure second operand isn't wider than the first one. */
4194 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4195 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4196 && (GET_MODE_UNIT_PRECISION (mode)
4197 < GET_MODE_PRECISION (op1_mode)))
4198 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4199 break;
4200 default:
4201 break;
4203 /* Fall through. */
4205 unary:
4206 case tcc_unary:
4207 if (mode == BLKmode)
4208 return NULL_RTX;
4209 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4210 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4211 if (!op0)
4212 return NULL_RTX;
4213 break;
4215 case tcc_comparison:
4216 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4217 goto binary;
4219 case tcc_type:
4220 case tcc_statement:
4221 gcc_unreachable ();
4223 case tcc_constant:
4224 case tcc_exceptional:
4225 case tcc_declaration:
4226 case tcc_reference:
4227 case tcc_vl_exp:
4228 break;
4231 switch (TREE_CODE (exp))
4233 case STRING_CST:
4234 if (!lookup_constant_def (exp))
4236 if (strlen (TREE_STRING_POINTER (exp)) + 1
4237 != (size_t) TREE_STRING_LENGTH (exp))
4238 return NULL_RTX;
4239 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4240 op0 = gen_rtx_MEM (BLKmode, op0);
4241 set_mem_attributes (op0, exp, 0);
4242 return op0;
4244 /* Fall through. */
4246 case INTEGER_CST:
4247 case REAL_CST:
4248 case FIXED_CST:
4249 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4250 return op0;
4252 case POLY_INT_CST:
4253 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4255 case COMPLEX_CST:
4256 gcc_assert (COMPLEX_MODE_P (mode));
4257 op0 = expand_debug_expr (TREE_REALPART (exp));
4258 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4259 return gen_rtx_CONCAT (mode, op0, op1);
4261 case DEBUG_EXPR_DECL:
4262 op0 = DECL_RTL_IF_SET (exp);
4264 if (op0)
4265 return op0;
4267 op0 = gen_rtx_DEBUG_EXPR (mode);
4268 DEBUG_EXPR_TREE_DECL (op0) = exp;
4269 SET_DECL_RTL (exp, op0);
4271 return op0;
4273 case VAR_DECL:
4274 case PARM_DECL:
4275 case FUNCTION_DECL:
4276 case LABEL_DECL:
4277 case CONST_DECL:
4278 case RESULT_DECL:
4279 op0 = DECL_RTL_IF_SET (exp);
4281 /* This decl was probably optimized away. */
4282 if (!op0)
4284 if (!VAR_P (exp)
4285 || DECL_EXTERNAL (exp)
4286 || !TREE_STATIC (exp)
4287 || !DECL_NAME (exp)
4288 || DECL_HARD_REGISTER (exp)
4289 || DECL_IN_CONSTANT_POOL (exp)
4290 || mode == VOIDmode)
4291 return NULL;
4293 op0 = make_decl_rtl_for_debug (exp);
4294 if (!MEM_P (op0)
4295 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4296 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4297 return NULL;
4299 else
4300 op0 = copy_rtx (op0);
4302 if (GET_MODE (op0) == BLKmode
4303 /* If op0 is not BLKmode, but mode is, adjust_mode
4304 below would ICE. While it is likely a FE bug,
4305 try to be robust here. See PR43166. */
4306 || mode == BLKmode
4307 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4309 gcc_assert (MEM_P (op0));
4310 op0 = adjust_address_nv (op0, mode, 0);
4311 return op0;
4314 /* Fall through. */
4316 adjust_mode:
4317 case PAREN_EXPR:
4318 CASE_CONVERT:
4320 inner_mode = GET_MODE (op0);
4322 if (mode == inner_mode)
4323 return op0;
4325 if (inner_mode == VOIDmode)
4327 if (TREE_CODE (exp) == SSA_NAME)
4328 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4329 else
4330 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4331 if (mode == inner_mode)
4332 return op0;
4335 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4337 if (GET_MODE_UNIT_BITSIZE (mode)
4338 == GET_MODE_UNIT_BITSIZE (inner_mode))
4339 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4340 else if (GET_MODE_UNIT_BITSIZE (mode)
4341 < GET_MODE_UNIT_BITSIZE (inner_mode))
4342 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4343 else
4344 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4346 else if (FLOAT_MODE_P (mode))
4348 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4349 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4350 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4351 else
4352 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4354 else if (FLOAT_MODE_P (inner_mode))
4356 if (unsignedp)
4357 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4358 else
4359 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4361 else if (GET_MODE_UNIT_PRECISION (mode)
4362 == GET_MODE_UNIT_PRECISION (inner_mode))
4363 op0 = lowpart_subreg (mode, op0, inner_mode);
4364 else if (GET_MODE_UNIT_PRECISION (mode)
4365 < GET_MODE_UNIT_PRECISION (inner_mode))
4366 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4367 else if (UNARY_CLASS_P (exp)
4368 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4369 : unsignedp)
4370 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4371 else
4372 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4374 return op0;
4377 case MEM_REF:
4378 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4380 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4381 TREE_OPERAND (exp, 0),
4382 TREE_OPERAND (exp, 1));
4383 if (newexp)
4384 return expand_debug_expr (newexp);
4386 /* FALLTHROUGH */
4387 case INDIRECT_REF:
4388 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4389 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4390 if (!op0)
4391 return NULL;
4393 if (TREE_CODE (exp) == MEM_REF)
4395 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4396 || (GET_CODE (op0) == PLUS
4397 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4398 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4399 Instead just use get_inner_reference. */
4400 goto component_ref;
4402 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4403 poly_int64 offset;
4404 if (!op1 || !poly_int_rtx_p (op1, &offset))
4405 return NULL;
4407 op0 = plus_constant (inner_mode, op0, offset);
4410 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4412 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4413 op0, as);
4414 if (op0 == NULL_RTX)
4415 return NULL;
4417 op0 = gen_rtx_MEM (mode, op0);
4418 set_mem_attributes (op0, exp, 0);
4419 if (TREE_CODE (exp) == MEM_REF
4420 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4421 set_mem_expr (op0, NULL_TREE);
4422 set_mem_addr_space (op0, as);
4424 return op0;
4426 case TARGET_MEM_REF:
4427 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4428 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4429 return NULL;
4431 op0 = expand_debug_expr
4432 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4433 if (!op0)
4434 return NULL;
4436 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4437 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4438 op0, as);
4439 if (op0 == NULL_RTX)
4440 return NULL;
4442 op0 = gen_rtx_MEM (mode, op0);
4444 set_mem_attributes (op0, exp, 0);
4445 set_mem_addr_space (op0, as);
4447 return op0;
4449 component_ref:
4450 case ARRAY_REF:
4451 case ARRAY_RANGE_REF:
4452 case COMPONENT_REF:
4453 case BIT_FIELD_REF:
4454 case REALPART_EXPR:
4455 case IMAGPART_EXPR:
4456 case VIEW_CONVERT_EXPR:
4458 machine_mode mode1;
4459 poly_int64 bitsize, bitpos;
4460 tree offset;
4461 int reversep, volatilep = 0;
4462 tree tem
4463 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4464 &unsignedp, &reversep, &volatilep);
4465 rtx orig_op0;
4467 if (known_eq (bitsize, 0))
4468 return NULL;
4470 orig_op0 = op0 = expand_debug_expr (tem);
4472 if (!op0)
4473 return NULL;
4475 if (offset)
4477 machine_mode addrmode, offmode;
4479 if (!MEM_P (op0))
4480 return NULL;
4482 op0 = XEXP (op0, 0);
4483 addrmode = GET_MODE (op0);
4484 if (addrmode == VOIDmode)
4485 addrmode = Pmode;
4487 op1 = expand_debug_expr (offset);
4488 if (!op1)
4489 return NULL;
4491 offmode = GET_MODE (op1);
4492 if (offmode == VOIDmode)
4493 offmode = TYPE_MODE (TREE_TYPE (offset));
4495 if (addrmode != offmode)
4496 op1 = lowpart_subreg (addrmode, op1, offmode);
4498 /* Don't use offset_address here, we don't need a
4499 recognizable address, and we don't want to generate
4500 code. */
4501 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4502 op0, op1));
4505 if (MEM_P (op0))
4507 if (mode1 == VOIDmode)
4509 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4510 return NULL;
4511 /* Bitfield. */
4512 mode1 = smallest_int_mode_for_size (bitsize);
4514 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4515 if (maybe_ne (bytepos, 0))
4517 op0 = adjust_address_nv (op0, mode1, bytepos);
4518 bitpos = num_trailing_bits (bitpos);
4520 else if (known_eq (bitpos, 0)
4521 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4522 op0 = adjust_address_nv (op0, mode, 0);
4523 else if (GET_MODE (op0) != mode1)
4524 op0 = adjust_address_nv (op0, mode1, 0);
4525 else
4526 op0 = copy_rtx (op0);
4527 if (op0 == orig_op0)
4528 op0 = shallow_copy_rtx (op0);
4529 set_mem_attributes (op0, exp, 0);
4532 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4533 return op0;
4535 if (maybe_lt (bitpos, 0))
4536 return NULL;
4538 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4539 return NULL;
4541 poly_int64 bytepos;
4542 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4543 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4545 machine_mode opmode = GET_MODE (op0);
4547 if (opmode == VOIDmode)
4548 opmode = TYPE_MODE (TREE_TYPE (tem));
4550 /* This condition may hold if we're expanding the address
4551 right past the end of an array that turned out not to
4552 be addressable (i.e., the address was only computed in
4553 debug stmts). The gen_subreg below would rightfully
4554 crash, and the address doesn't really exist, so just
4555 drop it. */
4556 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4557 return NULL;
4559 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4560 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4563 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4564 && TYPE_UNSIGNED (TREE_TYPE (exp))
4565 ? SIGN_EXTRACT
4566 : ZERO_EXTRACT, mode,
4567 GET_MODE (op0) != VOIDmode
4568 ? GET_MODE (op0)
4569 : TYPE_MODE (TREE_TYPE (tem)),
4570 op0, gen_int_mode (bitsize, word_mode),
4571 gen_int_mode (bitpos, word_mode));
4574 case ABS_EXPR:
4575 case ABSU_EXPR:
4576 return simplify_gen_unary (ABS, mode, op0, mode);
4578 case NEGATE_EXPR:
4579 return simplify_gen_unary (NEG, mode, op0, mode);
4581 case BIT_NOT_EXPR:
4582 return simplify_gen_unary (NOT, mode, op0, mode);
4584 case FLOAT_EXPR:
4585 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4586 0)))
4587 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4588 inner_mode);
4590 case FIX_TRUNC_EXPR:
4591 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4592 inner_mode);
4594 case POINTER_PLUS_EXPR:
4595 /* For the rare target where pointers are not the same size as
4596 size_t, we need to check for mis-matched modes and correct
4597 the addend. */
4598 if (op0 && op1
4599 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4600 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4601 && op0_mode != op1_mode)
4603 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4604 /* If OP0 is a partial mode, then we must truncate, even
4605 if it has the same bitsize as OP1 as GCC's
4606 representation of partial modes is opaque. */
4607 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4608 && (GET_MODE_BITSIZE (op0_mode)
4609 == GET_MODE_BITSIZE (op1_mode))))
4610 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4611 else
4612 /* We always sign-extend, regardless of the signedness of
4613 the operand, because the operand is always unsigned
4614 here even if the original C expression is signed. */
4615 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4617 /* Fall through. */
4618 case PLUS_EXPR:
4619 return simplify_gen_binary (PLUS, mode, op0, op1);
4621 case MINUS_EXPR:
4622 case POINTER_DIFF_EXPR:
4623 return simplify_gen_binary (MINUS, mode, op0, op1);
4625 case MULT_EXPR:
4626 return simplify_gen_binary (MULT, mode, op0, op1);
4628 case RDIV_EXPR:
4629 case TRUNC_DIV_EXPR:
4630 case EXACT_DIV_EXPR:
4631 if (unsignedp)
4632 return simplify_gen_binary (UDIV, mode, op0, op1);
4633 else
4634 return simplify_gen_binary (DIV, mode, op0, op1);
4636 case TRUNC_MOD_EXPR:
4637 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4639 case FLOOR_DIV_EXPR:
4640 if (unsignedp)
4641 return simplify_gen_binary (UDIV, mode, op0, op1);
4642 else
4644 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4645 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4646 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4647 return simplify_gen_binary (PLUS, mode, div, adj);
4650 case FLOOR_MOD_EXPR:
4651 if (unsignedp)
4652 return simplify_gen_binary (UMOD, mode, op0, op1);
4653 else
4655 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4656 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4657 adj = simplify_gen_unary (NEG, mode,
4658 simplify_gen_binary (MULT, mode, adj, op1),
4659 mode);
4660 return simplify_gen_binary (PLUS, mode, mod, adj);
4663 case CEIL_DIV_EXPR:
4664 if (unsignedp)
4666 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4667 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4668 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4669 return simplify_gen_binary (PLUS, mode, div, adj);
4671 else
4673 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4674 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4675 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4676 return simplify_gen_binary (PLUS, mode, div, adj);
4679 case CEIL_MOD_EXPR:
4680 if (unsignedp)
4682 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4683 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4684 adj = simplify_gen_unary (NEG, mode,
4685 simplify_gen_binary (MULT, mode, adj, op1),
4686 mode);
4687 return simplify_gen_binary (PLUS, mode, mod, adj);
4689 else
4691 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4692 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4693 adj = simplify_gen_unary (NEG, mode,
4694 simplify_gen_binary (MULT, mode, adj, op1),
4695 mode);
4696 return simplify_gen_binary (PLUS, mode, mod, adj);
4699 case ROUND_DIV_EXPR:
4700 if (unsignedp)
4702 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4703 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4704 rtx adj = round_udiv_adjust (mode, mod, op1);
4705 return simplify_gen_binary (PLUS, mode, div, adj);
4707 else
4709 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4710 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4711 rtx adj = round_sdiv_adjust (mode, mod, op1);
4712 return simplify_gen_binary (PLUS, mode, div, adj);
4715 case ROUND_MOD_EXPR:
4716 if (unsignedp)
4718 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4719 rtx adj = round_udiv_adjust (mode, mod, op1);
4720 adj = simplify_gen_unary (NEG, mode,
4721 simplify_gen_binary (MULT, mode, adj, op1),
4722 mode);
4723 return simplify_gen_binary (PLUS, mode, mod, adj);
4725 else
4727 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4728 rtx adj = round_sdiv_adjust (mode, mod, op1);
4729 adj = simplify_gen_unary (NEG, mode,
4730 simplify_gen_binary (MULT, mode, adj, op1),
4731 mode);
4732 return simplify_gen_binary (PLUS, mode, mod, adj);
4735 case LSHIFT_EXPR:
4736 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4738 case RSHIFT_EXPR:
4739 if (unsignedp)
4740 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4741 else
4742 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4744 case LROTATE_EXPR:
4745 return simplify_gen_binary (ROTATE, mode, op0, op1);
4747 case RROTATE_EXPR:
4748 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4750 case MIN_EXPR:
4751 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4753 case MAX_EXPR:
4754 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4756 case BIT_AND_EXPR:
4757 case TRUTH_AND_EXPR:
4758 return simplify_gen_binary (AND, mode, op0, op1);
4760 case BIT_IOR_EXPR:
4761 case TRUTH_OR_EXPR:
4762 return simplify_gen_binary (IOR, mode, op0, op1);
4764 case BIT_XOR_EXPR:
4765 case TRUTH_XOR_EXPR:
4766 return simplify_gen_binary (XOR, mode, op0, op1);
4768 case TRUTH_ANDIF_EXPR:
4769 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4771 case TRUTH_ORIF_EXPR:
4772 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4774 case TRUTH_NOT_EXPR:
4775 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4777 case LT_EXPR:
4778 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4779 op0, op1);
4781 case LE_EXPR:
4782 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4783 op0, op1);
4785 case GT_EXPR:
4786 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4787 op0, op1);
4789 case GE_EXPR:
4790 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4791 op0, op1);
4793 case EQ_EXPR:
4794 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4796 case NE_EXPR:
4797 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4799 case UNORDERED_EXPR:
4800 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4802 case ORDERED_EXPR:
4803 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4805 case UNLT_EXPR:
4806 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4808 case UNLE_EXPR:
4809 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4811 case UNGT_EXPR:
4812 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4814 case UNGE_EXPR:
4815 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4817 case UNEQ_EXPR:
4818 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4820 case LTGT_EXPR:
4821 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4823 case COND_EXPR:
4824 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4826 case COMPLEX_EXPR:
4827 gcc_assert (COMPLEX_MODE_P (mode));
4828 if (GET_MODE (op0) == VOIDmode)
4829 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4830 if (GET_MODE (op1) == VOIDmode)
4831 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4832 return gen_rtx_CONCAT (mode, op0, op1);
4834 case CONJ_EXPR:
4835 if (GET_CODE (op0) == CONCAT)
4836 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4837 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4838 XEXP (op0, 1),
4839 GET_MODE_INNER (mode)));
4840 else
4842 scalar_mode imode = GET_MODE_INNER (mode);
4843 rtx re, im;
4845 if (MEM_P (op0))
4847 re = adjust_address_nv (op0, imode, 0);
4848 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4850 else
4852 scalar_int_mode ifmode;
4853 scalar_int_mode ihmode;
4854 rtx halfsize;
4855 if (!int_mode_for_mode (mode).exists (&ifmode)
4856 || !int_mode_for_mode (imode).exists (&ihmode))
4857 return NULL;
4858 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4859 re = op0;
4860 if (mode != ifmode)
4861 re = gen_rtx_SUBREG (ifmode, re, 0);
4862 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4863 if (imode != ihmode)
4864 re = gen_rtx_SUBREG (imode, re, 0);
4865 im = copy_rtx (op0);
4866 if (mode != ifmode)
4867 im = gen_rtx_SUBREG (ifmode, im, 0);
4868 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4869 if (imode != ihmode)
4870 im = gen_rtx_SUBREG (imode, im, 0);
4872 im = gen_rtx_NEG (imode, im);
4873 return gen_rtx_CONCAT (mode, re, im);
4876 case ADDR_EXPR:
4877 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4878 if (!op0 || !MEM_P (op0))
4880 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4881 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4882 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4883 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4884 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4885 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4887 if (handled_component_p (TREE_OPERAND (exp, 0)))
4889 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
4890 bool reverse;
4891 tree decl
4892 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
4893 &bitsize, &maxsize, &reverse);
4894 if ((VAR_P (decl)
4895 || TREE_CODE (decl) == PARM_DECL
4896 || TREE_CODE (decl) == RESULT_DECL)
4897 && (!TREE_ADDRESSABLE (decl)
4898 || target_for_debug_bind (decl))
4899 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
4900 && known_gt (bitsize, 0)
4901 && known_eq (bitsize, maxsize))
4903 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4904 return plus_constant (mode, base, byteoffset);
4908 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4909 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4910 == ADDR_EXPR)
4912 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4913 0));
4914 if (op0 != NULL
4915 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4916 || (GET_CODE (op0) == PLUS
4917 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4918 && CONST_INT_P (XEXP (op0, 1)))))
4920 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4921 1));
4922 poly_int64 offset;
4923 if (!op1 || !poly_int_rtx_p (op1, &offset))
4924 return NULL;
4926 return plus_constant (mode, op0, offset);
4930 return NULL;
4933 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4934 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
4935 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
4937 return op0;
4939 case VECTOR_CST:
4941 unsigned HOST_WIDE_INT i, nelts;
4943 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
4944 return NULL;
4946 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
4948 for (i = 0; i < nelts; ++i)
4950 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4951 if (!op1)
4952 return NULL;
4953 XVECEXP (op0, 0, i) = op1;
4956 return op0;
4959 case CONSTRUCTOR:
4960 if (TREE_CLOBBER_P (exp))
4961 return NULL;
4962 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4964 unsigned i;
4965 unsigned HOST_WIDE_INT nelts;
4966 tree val;
4968 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
4969 goto flag_unsupported;
4971 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
4973 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4975 op1 = expand_debug_expr (val);
4976 if (!op1)
4977 return NULL;
4978 XVECEXP (op0, 0, i) = op1;
4981 if (i < nelts)
4983 op1 = expand_debug_expr
4984 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4986 if (!op1)
4987 return NULL;
4989 for (; i < nelts; i++)
4990 XVECEXP (op0, 0, i) = op1;
4993 return op0;
4995 else
4996 goto flag_unsupported;
4998 case CALL_EXPR:
4999 /* ??? Maybe handle some builtins? */
5000 return NULL;
5002 case SSA_NAME:
5004 gimple *g = get_gimple_for_ssa_name (exp);
5005 if (g)
5007 tree t = NULL_TREE;
5008 if (deep_ter_debug_map)
5010 tree *slot = deep_ter_debug_map->get (exp);
5011 if (slot)
5012 t = *slot;
5014 if (t == NULL_TREE)
5015 t = gimple_assign_rhs_to_tree (g);
5016 op0 = expand_debug_expr (t);
5017 if (!op0)
5018 return NULL;
5020 else
5022 /* If this is a reference to an incoming value of
5023 parameter that is never used in the code or where the
5024 incoming value is never used in the code, use
5025 PARM_DECL's DECL_RTL if set. */
5026 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5027 && SSA_NAME_VAR (exp)
5028 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5029 && has_zero_uses (exp))
5031 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5032 if (op0)
5033 goto adjust_mode;
5034 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5035 if (op0)
5036 goto adjust_mode;
5039 int part = var_to_partition (SA.map, exp);
5041 if (part == NO_PARTITION)
5042 return NULL;
5044 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5046 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5048 goto adjust_mode;
5051 case ERROR_MARK:
5052 return NULL;
5054 /* Vector stuff. For most of the codes we don't have rtl codes. */
5055 case REALIGN_LOAD_EXPR:
5056 case VEC_COND_EXPR:
5057 case VEC_PACK_FIX_TRUNC_EXPR:
5058 case VEC_PACK_FLOAT_EXPR:
5059 case VEC_PACK_SAT_EXPR:
5060 case VEC_PACK_TRUNC_EXPR:
5061 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5062 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5063 case VEC_UNPACK_FLOAT_HI_EXPR:
5064 case VEC_UNPACK_FLOAT_LO_EXPR:
5065 case VEC_UNPACK_HI_EXPR:
5066 case VEC_UNPACK_LO_EXPR:
5067 case VEC_WIDEN_MULT_HI_EXPR:
5068 case VEC_WIDEN_MULT_LO_EXPR:
5069 case VEC_WIDEN_MULT_EVEN_EXPR:
5070 case VEC_WIDEN_MULT_ODD_EXPR:
5071 case VEC_WIDEN_LSHIFT_HI_EXPR:
5072 case VEC_WIDEN_LSHIFT_LO_EXPR:
5073 case VEC_PERM_EXPR:
5074 case VEC_DUPLICATE_EXPR:
5075 case VEC_SERIES_EXPR:
5076 return NULL;
5078 /* Misc codes. */
5079 case ADDR_SPACE_CONVERT_EXPR:
5080 case FIXED_CONVERT_EXPR:
5081 case OBJ_TYPE_REF:
5082 case WITH_SIZE_EXPR:
5083 case BIT_INSERT_EXPR:
5084 return NULL;
5086 case DOT_PROD_EXPR:
5087 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5088 && SCALAR_INT_MODE_P (mode))
5091 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5092 0)))
5093 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5094 inner_mode);
5096 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5097 1)))
5098 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5099 inner_mode);
5100 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5101 return simplify_gen_binary (PLUS, mode, op0, op2);
5103 return NULL;
5105 case WIDEN_MULT_EXPR:
5106 case WIDEN_MULT_PLUS_EXPR:
5107 case WIDEN_MULT_MINUS_EXPR:
5108 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5109 && SCALAR_INT_MODE_P (mode))
5111 inner_mode = GET_MODE (op0);
5112 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5113 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5114 else
5115 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5116 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5117 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5118 else
5119 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5120 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5121 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5122 return op0;
5123 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5124 return simplify_gen_binary (PLUS, mode, op0, op2);
5125 else
5126 return simplify_gen_binary (MINUS, mode, op2, op0);
5128 return NULL;
5130 case MULT_HIGHPART_EXPR:
5131 /* ??? Similar to the above. */
5132 return NULL;
5134 case WIDEN_SUM_EXPR:
5135 case WIDEN_LSHIFT_EXPR:
5136 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5137 && SCALAR_INT_MODE_P (mode))
5140 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5141 0)))
5142 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5143 inner_mode);
5144 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5145 ? ASHIFT : PLUS, mode, op0, op1);
5147 return NULL;
5149 default:
5150 flag_unsupported:
5151 if (flag_checking)
5153 debug_tree (exp);
5154 gcc_unreachable ();
5156 return NULL;
5160 /* Return an RTX equivalent to the source bind value of the tree expression
5161 EXP. */
5163 static rtx
5164 expand_debug_source_expr (tree exp)
5166 rtx op0 = NULL_RTX;
5167 machine_mode mode = VOIDmode, inner_mode;
5169 switch (TREE_CODE (exp))
5171 case VAR_DECL:
5172 if (DECL_ABSTRACT_ORIGIN (exp))
5173 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5174 break;
5175 case PARM_DECL:
5177 mode = DECL_MODE (exp);
5178 op0 = expand_debug_parm_decl (exp);
5179 if (op0)
5180 break;
5181 /* See if this isn't an argument that has been completely
5182 optimized out. */
5183 if (!DECL_RTL_SET_P (exp)
5184 && !DECL_INCOMING_RTL (exp)
5185 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5187 tree aexp = DECL_ORIGIN (exp);
5188 if (DECL_CONTEXT (aexp)
5189 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5191 vec<tree, va_gc> **debug_args;
5192 unsigned int ix;
5193 tree ddecl;
5194 debug_args = decl_debug_args_lookup (current_function_decl);
5195 if (debug_args != NULL)
5197 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5198 ix += 2)
5199 if (ddecl == aexp)
5200 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5204 break;
5206 default:
5207 break;
5210 if (op0 == NULL_RTX)
5211 return NULL_RTX;
5213 inner_mode = GET_MODE (op0);
5214 if (mode == inner_mode)
5215 return op0;
5217 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5219 if (GET_MODE_UNIT_BITSIZE (mode)
5220 == GET_MODE_UNIT_BITSIZE (inner_mode))
5221 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5222 else if (GET_MODE_UNIT_BITSIZE (mode)
5223 < GET_MODE_UNIT_BITSIZE (inner_mode))
5224 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5225 else
5226 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5228 else if (FLOAT_MODE_P (mode))
5229 gcc_unreachable ();
5230 else if (FLOAT_MODE_P (inner_mode))
5232 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5233 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5234 else
5235 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5237 else if (GET_MODE_UNIT_PRECISION (mode)
5238 == GET_MODE_UNIT_PRECISION (inner_mode))
5239 op0 = lowpart_subreg (mode, op0, inner_mode);
5240 else if (GET_MODE_UNIT_PRECISION (mode)
5241 < GET_MODE_UNIT_PRECISION (inner_mode))
5242 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5243 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5244 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5245 else
5246 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5248 return op0;
5251 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5252 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5253 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5255 static void
5256 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5258 rtx exp = *exp_p;
5260 if (exp == NULL_RTX)
5261 return;
5263 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5264 return;
5266 if (depth == 4)
5268 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5269 rtx dval = make_debug_expr_from_rtl (exp);
5271 /* Emit a debug bind insn before INSN. */
5272 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5273 DEBUG_EXPR_TREE_DECL (dval), exp,
5274 VAR_INIT_STATUS_INITIALIZED);
5276 emit_debug_insn_before (bind, insn);
5277 *exp_p = dval;
5278 return;
5281 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5282 int i, j;
5283 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5284 switch (*format_ptr++)
5286 case 'e':
5287 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5288 break;
5290 case 'E':
5291 case 'V':
5292 for (j = 0; j < XVECLEN (exp, i); j++)
5293 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5294 break;
5296 default:
5297 break;
5301 /* Expand the _LOCs in debug insns. We run this after expanding all
5302 regular insns, so that any variables referenced in the function
5303 will have their DECL_RTLs set. */
5305 static void
5306 expand_debug_locations (void)
5308 rtx_insn *insn;
5309 rtx_insn *last = get_last_insn ();
5310 int save_strict_alias = flag_strict_aliasing;
5312 /* New alias sets while setting up memory attributes cause
5313 -fcompare-debug failures, even though it doesn't bring about any
5314 codegen changes. */
5315 flag_strict_aliasing = 0;
5317 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5318 if (DEBUG_BIND_INSN_P (insn))
5320 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5321 rtx val;
5322 rtx_insn *prev_insn, *insn2;
5323 machine_mode mode;
5325 if (value == NULL_TREE)
5326 val = NULL_RTX;
5327 else
5329 if (INSN_VAR_LOCATION_STATUS (insn)
5330 == VAR_INIT_STATUS_UNINITIALIZED)
5331 val = expand_debug_source_expr (value);
5332 /* The avoid_deep_ter_for_debug function inserts
5333 debug bind stmts after SSA_NAME definition, with the
5334 SSA_NAME as the whole bind location. Disable temporarily
5335 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5336 being defined in this DEBUG_INSN. */
5337 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5339 tree *slot = deep_ter_debug_map->get (value);
5340 if (slot)
5342 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5343 *slot = NULL_TREE;
5344 else
5345 slot = NULL;
5347 val = expand_debug_expr (value);
5348 if (slot)
5349 *slot = INSN_VAR_LOCATION_DECL (insn);
5351 else
5352 val = expand_debug_expr (value);
5353 gcc_assert (last == get_last_insn ());
5356 if (!val)
5357 val = gen_rtx_UNKNOWN_VAR_LOC ();
5358 else
5360 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5362 gcc_assert (mode == GET_MODE (val)
5363 || (GET_MODE (val) == VOIDmode
5364 && (CONST_SCALAR_INT_P (val)
5365 || GET_CODE (val) == CONST_FIXED
5366 || GET_CODE (val) == LABEL_REF)));
5369 INSN_VAR_LOCATION_LOC (insn) = val;
5370 prev_insn = PREV_INSN (insn);
5371 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5372 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5375 flag_strict_aliasing = save_strict_alias;
5378 /* Performs swapping operands of commutative operations to expand
5379 the expensive one first. */
5381 static void
5382 reorder_operands (basic_block bb)
5384 unsigned int *lattice; /* Hold cost of each statement. */
5385 unsigned int i = 0, n = 0;
5386 gimple_stmt_iterator gsi;
5387 gimple_seq stmts;
5388 gimple *stmt;
5389 bool swap;
5390 tree op0, op1;
5391 ssa_op_iter iter;
5392 use_operand_p use_p;
5393 gimple *def0, *def1;
5395 /* Compute cost of each statement using estimate_num_insns. */
5396 stmts = bb_seq (bb);
5397 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5399 stmt = gsi_stmt (gsi);
5400 if (!is_gimple_debug (stmt))
5401 gimple_set_uid (stmt, n++);
5403 lattice = XNEWVEC (unsigned int, n);
5404 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5406 unsigned cost;
5407 stmt = gsi_stmt (gsi);
5408 if (is_gimple_debug (stmt))
5409 continue;
5410 cost = estimate_num_insns (stmt, &eni_size_weights);
5411 lattice[i] = cost;
5412 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5414 tree use = USE_FROM_PTR (use_p);
5415 gimple *def_stmt;
5416 if (TREE_CODE (use) != SSA_NAME)
5417 continue;
5418 def_stmt = get_gimple_for_ssa_name (use);
5419 if (!def_stmt)
5420 continue;
5421 lattice[i] += lattice[gimple_uid (def_stmt)];
5423 i++;
5424 if (!is_gimple_assign (stmt)
5425 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5426 continue;
5427 op0 = gimple_op (stmt, 1);
5428 op1 = gimple_op (stmt, 2);
5429 if (TREE_CODE (op0) != SSA_NAME
5430 || TREE_CODE (op1) != SSA_NAME)
5431 continue;
5432 /* Swap operands if the second one is more expensive. */
5433 def0 = get_gimple_for_ssa_name (op0);
5434 def1 = get_gimple_for_ssa_name (op1);
5435 if (!def1)
5436 continue;
5437 swap = false;
5438 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5439 swap = true;
5440 if (swap)
5442 if (dump_file && (dump_flags & TDF_DETAILS))
5444 fprintf (dump_file, "Swap operands in stmt:\n");
5445 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5446 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5447 def0 ? lattice[gimple_uid (def0)] : 0,
5448 lattice[gimple_uid (def1)]);
5450 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5451 gimple_assign_rhs2_ptr (stmt));
5454 XDELETE (lattice);
5457 /* Expand basic block BB from GIMPLE trees to RTL. */
5459 static basic_block
5460 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5462 gimple_stmt_iterator gsi;
5463 gimple_seq stmts;
5464 gimple *stmt = NULL;
5465 rtx_note *note = NULL;
5466 rtx_insn *last;
5467 edge e;
5468 edge_iterator ei;
5470 if (dump_file)
5471 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5472 bb->index);
5474 /* Note that since we are now transitioning from GIMPLE to RTL, we
5475 cannot use the gsi_*_bb() routines because they expect the basic
5476 block to be in GIMPLE, instead of RTL. Therefore, we need to
5477 access the BB sequence directly. */
5478 if (optimize)
5479 reorder_operands (bb);
5480 stmts = bb_seq (bb);
5481 bb->il.gimple.seq = NULL;
5482 bb->il.gimple.phi_nodes = NULL;
5483 rtl_profile_for_bb (bb);
5484 init_rtl_bb_info (bb);
5485 bb->flags |= BB_RTL;
5487 /* Remove the RETURN_EXPR if we may fall though to the exit
5488 instead. */
5489 gsi = gsi_last (stmts);
5490 if (!gsi_end_p (gsi)
5491 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5493 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5495 gcc_assert (single_succ_p (bb));
5496 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5498 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5499 && !gimple_return_retval (ret_stmt))
5501 gsi_remove (&gsi, false);
5502 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5506 gsi = gsi_start (stmts);
5507 if (!gsi_end_p (gsi))
5509 stmt = gsi_stmt (gsi);
5510 if (gimple_code (stmt) != GIMPLE_LABEL)
5511 stmt = NULL;
5514 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5516 if (stmt || elt)
5518 gcc_checking_assert (!note);
5519 last = get_last_insn ();
5521 if (stmt)
5523 expand_gimple_stmt (stmt);
5524 gsi_next (&gsi);
5527 if (elt)
5528 emit_label (*elt);
5530 BB_HEAD (bb) = NEXT_INSN (last);
5531 if (NOTE_P (BB_HEAD (bb)))
5532 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5533 gcc_assert (LABEL_P (BB_HEAD (bb)));
5534 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5536 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5538 else
5539 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5541 if (note)
5542 NOTE_BASIC_BLOCK (note) = bb;
5544 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5546 basic_block new_bb;
5548 stmt = gsi_stmt (gsi);
5550 /* If this statement is a non-debug one, and we generate debug
5551 insns, then this one might be the last real use of a TERed
5552 SSA_NAME, but where there are still some debug uses further
5553 down. Expanding the current SSA name in such further debug
5554 uses by their RHS might lead to wrong debug info, as coalescing
5555 might make the operands of such RHS be placed into the same
5556 pseudo as something else. Like so:
5557 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5558 use(a_1);
5559 a_2 = ...
5560 #DEBUG ... => a_1
5561 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5562 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
5563 the write to a_2 would actually have clobbered the place which
5564 formerly held a_0.
5566 So, instead of that, we recognize the situation, and generate
5567 debug temporaries at the last real use of TERed SSA names:
5568 a_1 = a_0 + 1;
5569 #DEBUG #D1 => a_1
5570 use(a_1);
5571 a_2 = ...
5572 #DEBUG ... => #D1
5574 if (MAY_HAVE_DEBUG_BIND_INSNS
5575 && SA.values
5576 && !is_gimple_debug (stmt))
5578 ssa_op_iter iter;
5579 tree op;
5580 gimple *def;
5582 location_t sloc = curr_insn_location ();
5584 /* Look for SSA names that have their last use here (TERed
5585 names always have only one real use). */
5586 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5587 if ((def = get_gimple_for_ssa_name (op)))
5589 imm_use_iterator imm_iter;
5590 use_operand_p use_p;
5591 bool have_debug_uses = false;
5593 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5595 if (gimple_debug_bind_p (USE_STMT (use_p)))
5597 have_debug_uses = true;
5598 break;
5602 if (have_debug_uses)
5604 /* OP is a TERed SSA name, with DEF its defining
5605 statement, and where OP is used in further debug
5606 instructions. Generate a debug temporary, and
5607 replace all uses of OP in debug insns with that
5608 temporary. */
5609 gimple *debugstmt;
5610 tree value = gimple_assign_rhs_to_tree (def);
5611 tree vexpr = make_node (DEBUG_EXPR_DECL);
5612 rtx val;
5613 machine_mode mode;
5615 set_curr_insn_location (gimple_location (def));
5617 DECL_ARTIFICIAL (vexpr) = 1;
5618 TREE_TYPE (vexpr) = TREE_TYPE (value);
5619 if (DECL_P (value))
5620 mode = DECL_MODE (value);
5621 else
5622 mode = TYPE_MODE (TREE_TYPE (value));
5623 SET_DECL_MODE (vexpr, mode);
5625 val = gen_rtx_VAR_LOCATION
5626 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5628 emit_debug_insn (val);
5630 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5632 if (!gimple_debug_bind_p (debugstmt))
5633 continue;
5635 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5636 SET_USE (use_p, vexpr);
5638 update_stmt (debugstmt);
5642 set_curr_insn_location (sloc);
5645 currently_expanding_gimple_stmt = stmt;
5647 /* Expand this statement, then evaluate the resulting RTL and
5648 fixup the CFG accordingly. */
5649 if (gimple_code (stmt) == GIMPLE_COND)
5651 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5652 if (new_bb)
5653 return new_bb;
5655 else if (is_gimple_debug (stmt))
5657 location_t sloc = curr_insn_location ();
5658 gimple_stmt_iterator nsi = gsi;
5660 for (;;)
5662 tree var;
5663 tree value = NULL_TREE;
5664 rtx val = NULL_RTX;
5665 machine_mode mode;
5667 if (!gimple_debug_nonbind_marker_p (stmt))
5669 if (gimple_debug_bind_p (stmt))
5671 var = gimple_debug_bind_get_var (stmt);
5673 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5674 && TREE_CODE (var) != LABEL_DECL
5675 && !target_for_debug_bind (var))
5676 goto delink_debug_stmt;
5678 if (DECL_P (var))
5679 mode = DECL_MODE (var);
5680 else
5681 mode = TYPE_MODE (TREE_TYPE (var));
5683 if (gimple_debug_bind_has_value_p (stmt))
5684 value = gimple_debug_bind_get_value (stmt);
5686 val = gen_rtx_VAR_LOCATION
5687 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5689 else if (gimple_debug_source_bind_p (stmt))
5691 var = gimple_debug_source_bind_get_var (stmt);
5693 value = gimple_debug_source_bind_get_value (stmt);
5695 mode = DECL_MODE (var);
5697 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5698 VAR_INIT_STATUS_UNINITIALIZED);
5700 else
5701 gcc_unreachable ();
5703 /* If this function was first compiled with markers
5704 enabled, but they're now disable (e.g. LTO), drop
5705 them on the floor. */
5706 else if (gimple_debug_nonbind_marker_p (stmt)
5707 && !MAY_HAVE_DEBUG_MARKER_INSNS)
5708 goto delink_debug_stmt;
5709 else if (gimple_debug_begin_stmt_p (stmt))
5710 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
5711 else if (gimple_debug_inline_entry_p (stmt))
5713 tree block = gimple_block (stmt);
5715 if (block)
5716 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
5717 else
5718 goto delink_debug_stmt;
5720 else
5721 gcc_unreachable ();
5723 last = get_last_insn ();
5725 set_curr_insn_location (gimple_location (stmt));
5727 emit_debug_insn (val);
5729 if (dump_file && (dump_flags & TDF_DETAILS))
5731 /* We can't dump the insn with a TREE where an RTX
5732 is expected. */
5733 if (GET_CODE (val) == VAR_LOCATION)
5735 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
5736 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5738 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5739 if (GET_CODE (val) == VAR_LOCATION)
5740 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5743 delink_debug_stmt:
5744 /* In order not to generate too many debug temporaries,
5745 we delink all uses of debug statements we already expanded.
5746 Therefore debug statements between definition and real
5747 use of TERed SSA names will continue to use the SSA name,
5748 and not be replaced with debug temps. */
5749 delink_stmt_imm_use (stmt);
5751 gsi = nsi;
5752 gsi_next (&nsi);
5753 if (gsi_end_p (nsi))
5754 break;
5755 stmt = gsi_stmt (nsi);
5756 if (!is_gimple_debug (stmt))
5757 break;
5760 set_curr_insn_location (sloc);
5762 else
5764 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5765 if (call_stmt
5766 && gimple_call_tail_p (call_stmt)
5767 && disable_tail_calls)
5768 gimple_call_set_tail (call_stmt, false);
5770 if (call_stmt && gimple_call_tail_p (call_stmt))
5772 bool can_fallthru;
5773 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5774 if (new_bb)
5776 if (can_fallthru)
5777 bb = new_bb;
5778 else
5779 return new_bb;
5782 else
5784 def_operand_p def_p;
5785 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5787 if (def_p != NULL)
5789 /* Ignore this stmt if it is in the list of
5790 replaceable expressions. */
5791 if (SA.values
5792 && bitmap_bit_p (SA.values,
5793 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5794 continue;
5796 last = expand_gimple_stmt (stmt);
5797 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5802 currently_expanding_gimple_stmt = NULL;
5804 /* Expand implicit goto and convert goto_locus. */
5805 FOR_EACH_EDGE (e, ei, bb->succs)
5807 if (e->goto_locus != UNKNOWN_LOCATION)
5808 set_curr_insn_location (e->goto_locus);
5809 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5811 emit_jump (label_rtx_for_bb (e->dest));
5812 e->flags &= ~EDGE_FALLTHRU;
5816 /* Expanded RTL can create a jump in the last instruction of block.
5817 This later might be assumed to be a jump to successor and break edge insertion.
5818 We need to insert dummy move to prevent this. PR41440. */
5819 if (single_succ_p (bb)
5820 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5821 && (last = get_last_insn ())
5822 && (JUMP_P (last)
5823 || (DEBUG_INSN_P (last)
5824 && JUMP_P (prev_nondebug_insn (last)))))
5826 rtx dummy = gen_reg_rtx (SImode);
5827 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5830 do_pending_stack_adjust ();
5832 /* Find the block tail. The last insn in the block is the insn
5833 before a barrier and/or table jump insn. */
5834 last = get_last_insn ();
5835 if (BARRIER_P (last))
5836 last = PREV_INSN (last);
5837 if (JUMP_TABLE_DATA_P (last))
5838 last = PREV_INSN (PREV_INSN (last));
5839 if (BARRIER_P (last))
5840 last = PREV_INSN (last);
5841 BB_END (bb) = last;
5843 update_bb_for_insn (bb);
5845 return bb;
5849 /* Create a basic block for initialization code. */
5851 static basic_block
5852 construct_init_block (void)
5854 basic_block init_block, first_block;
5855 edge e = NULL;
5856 int flags;
5858 /* Multiple entry points not supported yet. */
5859 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5860 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5861 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5862 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5863 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5865 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5867 /* When entry edge points to first basic block, we don't need jump,
5868 otherwise we have to jump into proper target. */
5869 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5871 tree label = gimple_block_label (e->dest);
5873 emit_jump (jump_target_rtx (label));
5874 flags = 0;
5876 else
5877 flags = EDGE_FALLTHRU;
5879 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5880 get_last_insn (),
5881 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5882 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5883 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5884 if (e)
5886 first_block = e->dest;
5887 redirect_edge_succ (e, init_block);
5888 e = make_single_succ_edge (init_block, first_block, flags);
5890 else
5891 e = make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5892 EDGE_FALLTHRU);
5894 update_bb_for_insn (init_block);
5895 return init_block;
5898 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5899 found in the block tree. */
5901 static void
5902 set_block_levels (tree block, int level)
5904 while (block)
5906 BLOCK_NUMBER (block) = level;
5907 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5908 block = BLOCK_CHAIN (block);
5912 /* Create a block containing landing pads and similar stuff. */
5914 static void
5915 construct_exit_block (void)
5917 rtx_insn *head = get_last_insn ();
5918 rtx_insn *end;
5919 basic_block exit_block;
5920 edge e, e2;
5921 unsigned ix;
5922 edge_iterator ei;
5923 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5924 rtx_insn *orig_end = BB_END (prev_bb);
5926 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5928 /* Make sure the locus is set to the end of the function, so that
5929 epilogue line numbers and warnings are set properly. */
5930 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5931 input_location = cfun->function_end_locus;
5933 /* Generate rtl for function exit. */
5934 expand_function_end ();
5936 end = get_last_insn ();
5937 if (head == end)
5938 return;
5939 /* While emitting the function end we could move end of the last basic
5940 block. */
5941 BB_END (prev_bb) = orig_end;
5942 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5943 head = NEXT_INSN (head);
5944 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5945 bb count counting will be confused. Any instructions before that
5946 label are emitted for the case where PREV_BB falls through into the
5947 exit block, so append those instructions to prev_bb in that case. */
5948 if (NEXT_INSN (head) != return_label)
5950 while (NEXT_INSN (head) != return_label)
5952 if (!NOTE_P (NEXT_INSN (head)))
5953 BB_END (prev_bb) = NEXT_INSN (head);
5954 head = NEXT_INSN (head);
5957 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5958 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5959 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5961 ix = 0;
5962 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5964 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5965 if (!(e->flags & EDGE_ABNORMAL))
5966 redirect_edge_succ (e, exit_block);
5967 else
5968 ix++;
5971 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5972 EDGE_FALLTHRU);
5973 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5974 if (e2 != e)
5976 exit_block->count -= e2->count ();
5978 update_bb_for_insn (exit_block);
5981 /* Helper function for discover_nonconstant_array_refs.
5982 Look for ARRAY_REF nodes with non-constant indexes and mark them
5983 addressable. */
5985 static tree
5986 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5987 void *data ATTRIBUTE_UNUSED)
5989 tree t = *tp;
5991 if (IS_TYPE_OR_DECL_P (t))
5992 *walk_subtrees = 0;
5993 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5995 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5996 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5997 && (!TREE_OPERAND (t, 2)
5998 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5999 || (TREE_CODE (t) == COMPONENT_REF
6000 && (!TREE_OPERAND (t,2)
6001 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6002 || TREE_CODE (t) == BIT_FIELD_REF
6003 || TREE_CODE (t) == REALPART_EXPR
6004 || TREE_CODE (t) == IMAGPART_EXPR
6005 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6006 || CONVERT_EXPR_P (t))
6007 t = TREE_OPERAND (t, 0);
6009 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6011 t = get_base_address (t);
6012 if (t && DECL_P (t)
6013 && DECL_MODE (t) != BLKmode)
6014 TREE_ADDRESSABLE (t) = 1;
6017 *walk_subtrees = 0;
6020 return NULL_TREE;
6023 /* RTL expansion is not able to compile array references with variable
6024 offsets for arrays stored in single register. Discover such
6025 expressions and mark variables as addressable to avoid this
6026 scenario. */
6028 static void
6029 discover_nonconstant_array_refs (void)
6031 basic_block bb;
6032 gimple_stmt_iterator gsi;
6034 FOR_EACH_BB_FN (bb, cfun)
6035 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6037 gimple *stmt = gsi_stmt (gsi);
6038 if (!is_gimple_debug (stmt))
6039 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
6043 /* This function sets crtl->args.internal_arg_pointer to a virtual
6044 register if DRAP is needed. Local register allocator will replace
6045 virtual_incoming_args_rtx with the virtual register. */
6047 static void
6048 expand_stack_alignment (void)
6050 rtx drap_rtx;
6051 unsigned int preferred_stack_boundary;
6053 if (! SUPPORTS_STACK_ALIGNMENT)
6054 return;
6056 if (cfun->calls_alloca
6057 || cfun->has_nonlocal_label
6058 || crtl->has_nonlocal_goto)
6059 crtl->need_drap = true;
6061 /* Call update_stack_boundary here again to update incoming stack
6062 boundary. It may set incoming stack alignment to a different
6063 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6064 use the minimum incoming stack alignment to check if it is OK
6065 to perform sibcall optimization since sibcall optimization will
6066 only align the outgoing stack to incoming stack boundary. */
6067 if (targetm.calls.update_stack_boundary)
6068 targetm.calls.update_stack_boundary ();
6070 /* The incoming stack frame has to be aligned at least at
6071 parm_stack_boundary. */
6072 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6074 /* Update crtl->stack_alignment_estimated and use it later to align
6075 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6076 exceptions since callgraph doesn't collect incoming stack alignment
6077 in this case. */
6078 if (cfun->can_throw_non_call_exceptions
6079 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6080 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6081 else
6082 preferred_stack_boundary = crtl->preferred_stack_boundary;
6083 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6084 crtl->stack_alignment_estimated = preferred_stack_boundary;
6085 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6086 crtl->stack_alignment_needed = preferred_stack_boundary;
6088 gcc_assert (crtl->stack_alignment_needed
6089 <= crtl->stack_alignment_estimated);
6091 crtl->stack_realign_needed
6092 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6093 crtl->stack_realign_tried = crtl->stack_realign_needed;
6095 crtl->stack_realign_processed = true;
6097 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6098 alignment. */
6099 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6100 drap_rtx = targetm.calls.get_drap_rtx ();
6102 /* stack_realign_drap and drap_rtx must match. */
6103 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6105 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6106 if (drap_rtx != NULL)
6108 crtl->args.internal_arg_pointer = drap_rtx;
6110 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6111 needed. */
6112 fixup_tail_calls ();
6117 static void
6118 expand_main_function (void)
6120 #if (defined(INVOKE__main) \
6121 || (!defined(HAS_INIT_SECTION) \
6122 && !defined(INIT_SECTION_ASM_OP) \
6123 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6124 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6125 #endif
6129 /* Expand code to initialize the stack_protect_guard. This is invoked at
6130 the beginning of a function to be protected. */
6132 static void
6133 stack_protect_prologue (void)
6135 tree guard_decl = targetm.stack_protect_guard ();
6136 rtx x, y;
6138 x = expand_normal (crtl->stack_protect_guard);
6139 if (guard_decl)
6140 y = expand_normal (guard_decl);
6141 else
6142 y = const0_rtx;
6144 /* Allow the target to copy from Y to X without leaking Y into a
6145 register. */
6146 if (targetm.have_stack_protect_set ())
6147 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6149 emit_insn (insn);
6150 return;
6153 /* Otherwise do a straight move. */
6154 emit_move_insn (x, y);
6157 /* Translate the intermediate representation contained in the CFG
6158 from GIMPLE trees to RTL.
6160 We do conversion per basic block and preserve/update the tree CFG.
6161 This implies we have to do some magic as the CFG can simultaneously
6162 consist of basic blocks containing RTL and GIMPLE trees. This can
6163 confuse the CFG hooks, so be careful to not manipulate CFG during
6164 the expansion. */
6166 namespace {
6168 const pass_data pass_data_expand =
6170 RTL_PASS, /* type */
6171 "expand", /* name */
6172 OPTGROUP_NONE, /* optinfo_flags */
6173 TV_EXPAND, /* tv_id */
6174 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6175 | PROP_gimple_lcx
6176 | PROP_gimple_lvec
6177 | PROP_gimple_lva), /* properties_required */
6178 PROP_rtl, /* properties_provided */
6179 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6180 0, /* todo_flags_start */
6181 0, /* todo_flags_finish */
6184 class pass_expand : public rtl_opt_pass
6186 public:
6187 pass_expand (gcc::context *ctxt)
6188 : rtl_opt_pass (pass_data_expand, ctxt)
6191 /* opt_pass methods: */
6192 virtual unsigned int execute (function *);
6194 }; // class pass_expand
6196 unsigned int
6197 pass_expand::execute (function *fun)
6199 basic_block bb, init_block;
6200 edge_iterator ei;
6201 edge e;
6202 rtx_insn *var_seq, *var_ret_seq;
6203 unsigned i;
6205 timevar_push (TV_OUT_OF_SSA);
6206 rewrite_out_of_ssa (&SA);
6207 timevar_pop (TV_OUT_OF_SSA);
6208 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6210 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6212 gimple_stmt_iterator gsi;
6213 FOR_EACH_BB_FN (bb, cfun)
6214 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6215 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6216 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6219 /* Make sure all values used by the optimization passes have sane
6220 defaults. */
6221 reg_renumber = 0;
6223 /* Some backends want to know that we are expanding to RTL. */
6224 currently_expanding_to_rtl = 1;
6225 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6226 free_dominance_info (CDI_DOMINATORS);
6228 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6230 insn_locations_init ();
6231 if (!DECL_IS_BUILTIN (current_function_decl))
6233 /* Eventually, all FEs should explicitly set function_start_locus. */
6234 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6235 set_curr_insn_location
6236 (DECL_SOURCE_LOCATION (current_function_decl));
6237 else
6238 set_curr_insn_location (fun->function_start_locus);
6240 else
6241 set_curr_insn_location (UNKNOWN_LOCATION);
6242 prologue_location = curr_insn_location ();
6244 #ifdef INSN_SCHEDULING
6245 init_sched_attrs ();
6246 #endif
6248 /* Make sure first insn is a note even if we don't want linenums.
6249 This makes sure the first insn will never be deleted.
6250 Also, final expects a note to appear there. */
6251 emit_note (NOTE_INSN_DELETED);
6253 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6254 discover_nonconstant_array_refs ();
6256 targetm.expand_to_rtl_hook ();
6257 crtl->init_stack_alignment ();
6258 fun->cfg->max_jumptable_ents = 0;
6260 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
6261 of the function section at exapnsion time to predict distance of calls. */
6262 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6264 /* Expand the variables recorded during gimple lowering. */
6265 timevar_push (TV_VAR_EXPAND);
6266 start_sequence ();
6268 var_ret_seq = expand_used_vars ();
6270 var_seq = get_insns ();
6271 end_sequence ();
6272 timevar_pop (TV_VAR_EXPAND);
6274 /* Honor stack protection warnings. */
6275 if (warn_stack_protect)
6277 if (fun->calls_alloca)
6278 warning (OPT_Wstack_protector,
6279 "stack protector not protecting local variables: "
6280 "variable length buffer");
6281 if (has_short_buffer && !crtl->stack_protect_guard)
6282 warning (OPT_Wstack_protector,
6283 "stack protector not protecting function: "
6284 "all local arrays are less than %d bytes long",
6285 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6288 /* Set up parameters and prepare for return, for the function. */
6289 expand_function_start (current_function_decl);
6291 /* If we emitted any instructions for setting up the variables,
6292 emit them before the FUNCTION_START note. */
6293 if (var_seq)
6295 emit_insn_before (var_seq, parm_birth_insn);
6297 /* In expand_function_end we'll insert the alloca save/restore
6298 before parm_birth_insn. We've just insertted an alloca call.
6299 Adjust the pointer to match. */
6300 parm_birth_insn = var_seq;
6303 /* Now propagate the RTL assignment of each partition to the
6304 underlying var of each SSA_NAME. */
6305 tree name;
6307 FOR_EACH_SSA_NAME (i, name, cfun)
6309 /* We might have generated new SSA names in
6310 update_alias_info_with_stack_vars. They will have a NULL
6311 defining statements, and won't be part of the partitioning,
6312 so ignore those. */
6313 if (!SSA_NAME_DEF_STMT (name))
6314 continue;
6316 adjust_one_expanded_partition_var (name);
6319 /* Clean up RTL of variables that straddle across multiple
6320 partitions, and check that the rtl of any PARM_DECLs that are not
6321 cleaned up is that of their default defs. */
6322 FOR_EACH_SSA_NAME (i, name, cfun)
6324 int part;
6326 /* We might have generated new SSA names in
6327 update_alias_info_with_stack_vars. They will have a NULL
6328 defining statements, and won't be part of the partitioning,
6329 so ignore those. */
6330 if (!SSA_NAME_DEF_STMT (name))
6331 continue;
6332 part = var_to_partition (SA.map, name);
6333 if (part == NO_PARTITION)
6334 continue;
6336 /* If this decl was marked as living in multiple places, reset
6337 this now to NULL. */
6338 tree var = SSA_NAME_VAR (name);
6339 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6340 SET_DECL_RTL (var, NULL);
6341 /* Check that the pseudos chosen by assign_parms are those of
6342 the corresponding default defs. */
6343 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6344 && (TREE_CODE (var) == PARM_DECL
6345 || TREE_CODE (var) == RESULT_DECL))
6347 rtx in = DECL_RTL_IF_SET (var);
6348 gcc_assert (in);
6349 rtx out = SA.partition_to_pseudo[part];
6350 gcc_assert (in == out);
6352 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6353 those expected by debug backends for each parm and for
6354 the result. This is particularly important for stabs,
6355 whose register elimination from parm's DECL_RTL may cause
6356 -fcompare-debug differences as SET_DECL_RTL changes reg's
6357 attrs. So, make sure the RTL already has the parm as the
6358 EXPR, so that it won't change. */
6359 SET_DECL_RTL (var, NULL_RTX);
6360 if (MEM_P (in))
6361 set_mem_attributes (in, var, true);
6362 SET_DECL_RTL (var, in);
6366 /* If this function is `main', emit a call to `__main'
6367 to run global initializers, etc. */
6368 if (DECL_NAME (current_function_decl)
6369 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6370 && DECL_FILE_SCOPE_P (current_function_decl))
6371 expand_main_function ();
6373 /* Initialize the stack_protect_guard field. This must happen after the
6374 call to __main (if any) so that the external decl is initialized. */
6375 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6376 stack_protect_prologue ();
6378 expand_phi_nodes (&SA);
6380 /* Release any stale SSA redirection data. */
6381 redirect_edge_var_map_empty ();
6383 /* Register rtl specific functions for cfg. */
6384 rtl_register_cfg_hooks ();
6386 init_block = construct_init_block ();
6388 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6389 remaining edges later. */
6390 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6391 e->flags &= ~EDGE_EXECUTABLE;
6393 /* If the function has too many markers, drop them while expanding. */
6394 if (cfun->debug_marker_count
6395 >= PARAM_VALUE (PARAM_MAX_DEBUG_MARKER_COUNT))
6396 cfun->debug_nonbind_markers = false;
6398 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6399 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6400 next_bb)
6401 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6403 if (MAY_HAVE_DEBUG_BIND_INSNS)
6404 expand_debug_locations ();
6406 if (deep_ter_debug_map)
6408 delete deep_ter_debug_map;
6409 deep_ter_debug_map = NULL;
6412 /* Free stuff we no longer need after GIMPLE optimizations. */
6413 free_dominance_info (CDI_DOMINATORS);
6414 free_dominance_info (CDI_POST_DOMINATORS);
6415 delete_tree_cfg_annotations (fun);
6417 timevar_push (TV_OUT_OF_SSA);
6418 finish_out_of_ssa (&SA);
6419 timevar_pop (TV_OUT_OF_SSA);
6421 timevar_push (TV_POST_EXPAND);
6422 /* We are no longer in SSA form. */
6423 fun->gimple_df->in_ssa_p = false;
6424 loops_state_clear (LOOP_CLOSED_SSA);
6426 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6427 conservatively to true until they are all profile aware. */
6428 delete lab_rtx_for_bb;
6429 free_histograms (fun);
6431 construct_exit_block ();
6432 insn_locations_finalize ();
6434 if (var_ret_seq)
6436 rtx_insn *after = return_label;
6437 rtx_insn *next = NEXT_INSN (after);
6438 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6439 after = next;
6440 emit_insn_after (var_ret_seq, after);
6443 /* Zap the tree EH table. */
6444 set_eh_throw_stmt_table (fun, NULL);
6446 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6447 split edges which edge insertions might do. */
6448 rebuild_jump_labels (get_insns ());
6450 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6451 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6453 edge e;
6454 edge_iterator ei;
6455 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6457 if (e->insns.r)
6459 rebuild_jump_labels_chain (e->insns.r);
6460 /* Put insns after parm birth, but before
6461 NOTE_INSNS_FUNCTION_BEG. */
6462 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6463 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6465 rtx_insn *insns = e->insns.r;
6466 e->insns.r = NULL;
6467 if (NOTE_P (parm_birth_insn)
6468 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6469 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6470 else
6471 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6473 else
6474 commit_one_edge_insertion (e);
6476 else
6477 ei_next (&ei);
6481 /* We're done expanding trees to RTL. */
6482 currently_expanding_to_rtl = 0;
6484 flush_mark_addressable_queue ();
6486 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6487 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6489 edge e;
6490 edge_iterator ei;
6491 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6493 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6494 e->flags &= ~EDGE_EXECUTABLE;
6496 /* At the moment not all abnormal edges match the RTL
6497 representation. It is safe to remove them here as
6498 find_many_sub_basic_blocks will rediscover them.
6499 In the future we should get this fixed properly. */
6500 if ((e->flags & EDGE_ABNORMAL)
6501 && !(e->flags & EDGE_SIBCALL))
6502 remove_edge (e);
6503 else
6504 ei_next (&ei);
6508 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6509 bitmap_ones (blocks);
6510 find_many_sub_basic_blocks (blocks);
6511 purge_all_dead_edges ();
6513 expand_stack_alignment ();
6515 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6516 function. */
6517 if (crtl->tail_call_emit)
6518 fixup_tail_calls ();
6520 /* After initial rtl generation, call back to finish generating
6521 exception support code. We need to do this before cleaning up
6522 the CFG as the code does not expect dead landing pads. */
6523 if (fun->eh->region_tree != NULL)
6524 finish_eh_generation ();
6526 /* BB subdivision may have created basic blocks that are are only reachable
6527 from unlikely bbs but not marked as such in the profile. */
6528 if (optimize)
6529 propagate_unlikely_bbs_forward ();
6531 /* Remove unreachable blocks, otherwise we cannot compute dominators
6532 which are needed for loop state verification. As a side-effect
6533 this also compacts blocks.
6534 ??? We cannot remove trivially dead insns here as for example
6535 the DRAP reg on i?86 is not magically live at this point.
6536 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6537 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6539 checking_verify_flow_info ();
6541 /* Initialize pseudos allocated for hard registers. */
6542 emit_initial_value_sets ();
6544 /* And finally unshare all RTL. */
6545 unshare_all_rtl ();
6547 /* There's no need to defer outputting this function any more; we
6548 know we want to output it. */
6549 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6551 /* Now that we're done expanding trees to RTL, we shouldn't have any
6552 more CONCATs anywhere. */
6553 generating_concat_p = 0;
6555 if (dump_file)
6557 fprintf (dump_file,
6558 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6559 /* And the pass manager will dump RTL for us. */
6562 /* If we're emitting a nested function, make sure its parent gets
6563 emitted as well. Doing otherwise confuses debug info. */
6565 tree parent;
6566 for (parent = DECL_CONTEXT (current_function_decl);
6567 parent != NULL_TREE;
6568 parent = get_containing_scope (parent))
6569 if (TREE_CODE (parent) == FUNCTION_DECL)
6570 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6573 TREE_ASM_WRITTEN (current_function_decl) = 1;
6575 /* After expanding, the return labels are no longer needed. */
6576 return_label = NULL;
6577 naked_return_label = NULL;
6579 /* After expanding, the tm_restart map is no longer needed. */
6580 if (fun->gimple_df->tm_restart)
6581 fun->gimple_df->tm_restart = NULL;
6583 /* Tag the blocks with a depth number so that change_scope can find
6584 the common parent easily. */
6585 set_block_levels (DECL_INITIAL (fun->decl), 0);
6586 default_rtl_profile ();
6588 /* For -dx discard loops now, otherwise IL verify in clean_state will
6589 ICE. */
6590 if (rtl_dump_and_exit)
6592 cfun->curr_properties &= ~PROP_loops;
6593 loop_optimizer_finalize ();
6596 timevar_pop (TV_POST_EXPAND);
6598 return 0;
6601 } // anon namespace
6603 rtl_opt_pass *
6604 make_pass_expand (gcc::context *ctxt)
6606 return new pass_expand (ctxt);