PR middle-end/86864
[official-gcc.git] / gcc / cfgexpand.c
blobc8d7805308c464a443dc003c25094e0ca99f976a
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2018 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "params.h"
65 #include "tree-inline.h"
66 #include "value-prof.h"
67 #include "tree-ssa-live.h"
68 #include "tree-outof-ssa.h"
69 #include "cfgloop.h"
70 #include "insn-attr.h" /* For INSN_SCHEDULING. */
71 #include "stringpool.h"
72 #include "attribs.h"
73 #include "asan.h"
74 #include "tree-ssa-address.h"
75 #include "output.h"
76 #include "builtins.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of comminucating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 enum gimple_rhs_class grhs_class;
109 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
111 if (grhs_class == GIMPLE_TERNARY_RHS)
112 t = build3 (gimple_assign_rhs_code (stmt),
113 TREE_TYPE (gimple_assign_lhs (stmt)),
114 gimple_assign_rhs1 (stmt),
115 gimple_assign_rhs2 (stmt),
116 gimple_assign_rhs3 (stmt));
117 else if (grhs_class == GIMPLE_BINARY_RHS)
118 t = build2 (gimple_assign_rhs_code (stmt),
119 TREE_TYPE (gimple_assign_lhs (stmt)),
120 gimple_assign_rhs1 (stmt),
121 gimple_assign_rhs2 (stmt));
122 else if (grhs_class == GIMPLE_UNARY_RHS)
123 t = build1 (gimple_assign_rhs_code (stmt),
124 TREE_TYPE (gimple_assign_lhs (stmt)),
125 gimple_assign_rhs1 (stmt));
126 else if (grhs_class == GIMPLE_SINGLE_RHS)
128 t = gimple_assign_rhs1 (stmt);
129 /* Avoid modifying this tree in place below. */
130 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
131 && gimple_location (stmt) != EXPR_LOCATION (t))
132 || (gimple_block (stmt)
133 && currently_expanding_to_rtl
134 && EXPR_P (t)))
135 t = copy_node (t);
137 else
138 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 struct stack_var
310 /* The Variable. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
314 if this variable becomes it's partition's representative. */
315 poly_uint64 size;
317 /* The *byte* alignment required for this variable. Or as, with the
318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* The partition representative. */
322 size_t representative;
324 /* The next stack variable in the partition, or EOC. */
325 size_t next;
327 /* The numbers of conflicting stack variables. */
328 bitmap conflicts;
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation. */
334 static struct stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
344 is non-decreasing. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
356 /* Used during expand_used_vars. Remember if we say a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
360 /* Compute the byte alignment to use for DECL. Ignore alignment
361 we can't do with expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
369 align = TYPE_ALIGN (TREE_TYPE (decl));
370 else
372 align = LOCAL_DECL_ALIGNMENT (decl);
373 SET_DECL_ALIGN (decl, align);
375 return align / BITS_PER_UNIT;
378 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
379 down otherwise. Return truncated BASE value. */
381 static inline unsigned HOST_WIDE_INT
382 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
384 return align_up ? (base + align - 1) & -align : base & -align;
387 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
388 Return the frame offset. */
390 static poly_int64
391 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
393 poly_int64 offset, new_frame_offset;
395 if (FRAME_GROWS_DOWNWARD)
397 new_frame_offset
398 = aligned_lower_bound (frame_offset - frame_phase - size,
399 align) + frame_phase;
400 offset = new_frame_offset;
402 else
404 new_frame_offset
405 = aligned_upper_bound (frame_offset - frame_phase,
406 align) + frame_phase;
407 offset = new_frame_offset;
408 new_frame_offset += size;
410 frame_offset = new_frame_offset;
412 if (frame_offset_overflow (frame_offset, cfun->decl))
413 frame_offset = offset = 0;
415 return offset;
418 /* Accumulate DECL into STACK_VARS. */
420 static void
421 add_stack_var (tree decl)
423 struct stack_var *v;
425 if (stack_vars_num >= stack_vars_alloc)
427 if (stack_vars_alloc)
428 stack_vars_alloc = stack_vars_alloc * 3 / 2;
429 else
430 stack_vars_alloc = 32;
431 stack_vars
432 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
434 if (!decl_to_stack_part)
435 decl_to_stack_part = new hash_map<tree, size_t>;
437 v = &stack_vars[stack_vars_num];
438 decl_to_stack_part->put (decl, stack_vars_num);
440 v->decl = decl;
441 tree size = TREE_CODE (decl) == SSA_NAME
442 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
443 : DECL_SIZE_UNIT (decl);
444 v->size = tree_to_poly_uint64 (size);
445 /* Ensure that all variables have size, so that &a != &b for any two
446 variables that are simultaneously live. */
447 if (known_eq (v->size, 0U))
448 v->size = 1;
449 v->alignb = align_local_variable (decl);
450 /* An alignment of zero can mightily confuse us later. */
451 gcc_assert (v->alignb != 0);
453 /* All variables are initially in their own partition. */
454 v->representative = stack_vars_num;
455 v->next = EOC;
457 /* All variables initially conflict with no other. */
458 v->conflicts = NULL;
460 /* Ensure that this decl doesn't get put onto the list twice. */
461 set_rtl (decl, pc_rtx);
463 stack_vars_num++;
466 /* Make the decls associated with luid's X and Y conflict. */
468 static void
469 add_stack_var_conflict (size_t x, size_t y)
471 struct stack_var *a = &stack_vars[x];
472 struct stack_var *b = &stack_vars[y];
473 if (!a->conflicts)
474 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
475 if (!b->conflicts)
476 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
477 bitmap_set_bit (a->conflicts, y);
478 bitmap_set_bit (b->conflicts, x);
481 /* Check whether the decls associated with luid's X and Y conflict. */
483 static bool
484 stack_var_conflict_p (size_t x, size_t y)
486 struct stack_var *a = &stack_vars[x];
487 struct stack_var *b = &stack_vars[y];
488 if (x == y)
489 return false;
490 /* Partitions containing an SSA name result from gimple registers
491 with things like unsupported modes. They are top-level and
492 hence conflict with everything else. */
493 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
494 return true;
496 if (!a->conflicts || !b->conflicts)
497 return false;
498 return bitmap_bit_p (a->conflicts, y);
501 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
502 enter its partition number into bitmap DATA. */
504 static bool
505 visit_op (gimple *, tree op, tree, void *data)
507 bitmap active = (bitmap)data;
508 op = get_base_address (op);
509 if (op
510 && DECL_P (op)
511 && DECL_RTL_IF_SET (op) == pc_rtx)
513 size_t *v = decl_to_stack_part->get (op);
514 if (v)
515 bitmap_set_bit (active, *v);
517 return false;
520 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
521 record conflicts between it and all currently active other partitions
522 from bitmap DATA. */
524 static bool
525 visit_conflict (gimple *, tree op, tree, void *data)
527 bitmap active = (bitmap)data;
528 op = get_base_address (op);
529 if (op
530 && DECL_P (op)
531 && DECL_RTL_IF_SET (op) == pc_rtx)
533 size_t *v = decl_to_stack_part->get (op);
534 if (v && bitmap_set_bit (active, *v))
536 size_t num = *v;
537 bitmap_iterator bi;
538 unsigned i;
539 gcc_assert (num < stack_vars_num);
540 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
541 add_stack_var_conflict (num, i);
544 return false;
547 /* Helper routine for add_scope_conflicts, calculating the active partitions
548 at the end of BB, leaving the result in WORK. We're called to generate
549 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
550 liveness. */
552 static void
553 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
555 edge e;
556 edge_iterator ei;
557 gimple_stmt_iterator gsi;
558 walk_stmt_load_store_addr_fn visit;
560 bitmap_clear (work);
561 FOR_EACH_EDGE (e, ei, bb->preds)
562 bitmap_ior_into (work, (bitmap)e->src->aux);
564 visit = visit_op;
566 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
568 gimple *stmt = gsi_stmt (gsi);
569 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
571 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
573 gimple *stmt = gsi_stmt (gsi);
575 if (gimple_clobber_p (stmt))
577 tree lhs = gimple_assign_lhs (stmt);
578 size_t *v;
579 /* Nested function lowering might introduce LHSs
580 that are COMPONENT_REFs. */
581 if (!VAR_P (lhs))
582 continue;
583 if (DECL_RTL_IF_SET (lhs) == pc_rtx
584 && (v = decl_to_stack_part->get (lhs)))
585 bitmap_clear_bit (work, *v);
587 else if (!is_gimple_debug (stmt))
589 if (for_conflict
590 && visit == visit_op)
592 /* If this is the first real instruction in this BB we need
593 to add conflicts for everything live at this point now.
594 Unlike classical liveness for named objects we can't
595 rely on seeing a def/use of the names we're interested in.
596 There might merely be indirect loads/stores. We'd not add any
597 conflicts for such partitions. */
598 bitmap_iterator bi;
599 unsigned i;
600 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
602 struct stack_var *a = &stack_vars[i];
603 if (!a->conflicts)
604 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
605 bitmap_ior_into (a->conflicts, work);
607 visit = visit_conflict;
609 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
614 /* Generate stack partition conflicts between all partitions that are
615 simultaneously live. */
617 static void
618 add_scope_conflicts (void)
620 basic_block bb;
621 bool changed;
622 bitmap work = BITMAP_ALLOC (NULL);
623 int *rpo;
624 int n_bbs;
626 /* We approximate the live range of a stack variable by taking the first
627 mention of its name as starting point(s), and by the end-of-scope
628 death clobber added by gimplify as ending point(s) of the range.
629 This overapproximates in the case we for instance moved an address-taken
630 operation upward, without also moving a dereference to it upwards.
631 But it's conservatively correct as a variable never can hold values
632 before its name is mentioned at least once.
634 We then do a mostly classical bitmap liveness algorithm. */
636 FOR_ALL_BB_FN (bb, cfun)
637 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
639 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
640 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
642 changed = true;
643 while (changed)
645 int i;
646 changed = false;
647 for (i = 0; i < n_bbs; i++)
649 bitmap active;
650 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
651 active = (bitmap)bb->aux;
652 add_scope_conflicts_1 (bb, work, false);
653 if (bitmap_ior_into (active, work))
654 changed = true;
658 FOR_EACH_BB_FN (bb, cfun)
659 add_scope_conflicts_1 (bb, work, true);
661 free (rpo);
662 BITMAP_FREE (work);
663 FOR_ALL_BB_FN (bb, cfun)
664 BITMAP_FREE (bb->aux);
667 /* A subroutine of partition_stack_vars. A comparison function for qsort,
668 sorting an array of indices by the properties of the object. */
670 static int
671 stack_var_cmp (const void *a, const void *b)
673 size_t ia = *(const size_t *)a;
674 size_t ib = *(const size_t *)b;
675 unsigned int aligna = stack_vars[ia].alignb;
676 unsigned int alignb = stack_vars[ib].alignb;
677 poly_int64 sizea = stack_vars[ia].size;
678 poly_int64 sizeb = stack_vars[ib].size;
679 tree decla = stack_vars[ia].decl;
680 tree declb = stack_vars[ib].decl;
681 bool largea, largeb;
682 unsigned int uida, uidb;
684 /* Primary compare on "large" alignment. Large comes first. */
685 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
686 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
687 if (largea != largeb)
688 return (int)largeb - (int)largea;
690 /* Secondary compare on size, decreasing */
691 int diff = compare_sizes_for_sort (sizeb, sizea);
692 if (diff != 0)
693 return diff;
695 /* Tertiary compare on true alignment, decreasing. */
696 if (aligna < alignb)
697 return -1;
698 if (aligna > alignb)
699 return 1;
701 /* Final compare on ID for sort stability, increasing.
702 Two SSA names are compared by their version, SSA names come before
703 non-SSA names, and two normal decls are compared by their DECL_UID. */
704 if (TREE_CODE (decla) == SSA_NAME)
706 if (TREE_CODE (declb) == SSA_NAME)
707 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
708 else
709 return -1;
711 else if (TREE_CODE (declb) == SSA_NAME)
712 return 1;
713 else
714 uida = DECL_UID (decla), uidb = DECL_UID (declb);
715 if (uida < uidb)
716 return 1;
717 if (uida > uidb)
718 return -1;
719 return 0;
722 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
723 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
725 /* If the points-to solution *PI points to variables that are in a partition
726 together with other variables add all partition members to the pointed-to
727 variables bitmap. */
729 static void
730 add_partitioned_vars_to_ptset (struct pt_solution *pt,
731 part_hashmap *decls_to_partitions,
732 hash_set<bitmap> *visited, bitmap temp)
734 bitmap_iterator bi;
735 unsigned i;
736 bitmap *part;
738 if (pt->anything
739 || pt->vars == NULL
740 /* The pointed-to vars bitmap is shared, it is enough to
741 visit it once. */
742 || visited->add (pt->vars))
743 return;
745 bitmap_clear (temp);
747 /* By using a temporary bitmap to store all members of the partitions
748 we have to add we make sure to visit each of the partitions only
749 once. */
750 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
751 if ((!temp
752 || !bitmap_bit_p (temp, i))
753 && (part = decls_to_partitions->get (i)))
754 bitmap_ior_into (temp, *part);
755 if (!bitmap_empty_p (temp))
756 bitmap_ior_into (pt->vars, temp);
759 /* Update points-to sets based on partition info, so we can use them on RTL.
760 The bitmaps representing stack partitions will be saved until expand,
761 where partitioned decls used as bases in memory expressions will be
762 rewritten. */
764 static void
765 update_alias_info_with_stack_vars (void)
767 part_hashmap *decls_to_partitions = NULL;
768 size_t i, j;
769 tree var = NULL_TREE;
771 for (i = 0; i < stack_vars_num; i++)
773 bitmap part = NULL;
774 tree name;
775 struct ptr_info_def *pi;
777 /* Not interested in partitions with single variable. */
778 if (stack_vars[i].representative != i
779 || stack_vars[i].next == EOC)
780 continue;
782 if (!decls_to_partitions)
784 decls_to_partitions = new part_hashmap;
785 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
788 /* Create an SSA_NAME that points to the partition for use
789 as base during alias-oracle queries on RTL for bases that
790 have been partitioned. */
791 if (var == NULL_TREE)
792 var = create_tmp_var (ptr_type_node);
793 name = make_ssa_name (var);
795 /* Create bitmaps representing partitions. They will be used for
796 points-to sets later, so use GGC alloc. */
797 part = BITMAP_GGC_ALLOC ();
798 for (j = i; j != EOC; j = stack_vars[j].next)
800 tree decl = stack_vars[j].decl;
801 unsigned int uid = DECL_PT_UID (decl);
802 bitmap_set_bit (part, uid);
803 decls_to_partitions->put (uid, part);
804 cfun->gimple_df->decls_to_pointers->put (decl, name);
805 if (TREE_ADDRESSABLE (decl))
806 TREE_ADDRESSABLE (name) = 1;
809 /* Make the SSA name point to all partition members. */
810 pi = get_ptr_info (name);
811 pt_solution_set (&pi->pt, part, false);
814 /* Make all points-to sets that contain one member of a partition
815 contain all members of the partition. */
816 if (decls_to_partitions)
818 unsigned i;
819 tree name;
820 hash_set<bitmap> visited;
821 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
823 FOR_EACH_SSA_NAME (i, name, cfun)
825 struct ptr_info_def *pi;
827 if (POINTER_TYPE_P (TREE_TYPE (name))
828 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
829 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
830 &visited, temp);
833 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
834 decls_to_partitions, &visited, temp);
836 delete decls_to_partitions;
837 BITMAP_FREE (temp);
841 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
842 partitioning algorithm. Partitions A and B are known to be non-conflicting.
843 Merge them into a single partition A. */
845 static void
846 union_stack_vars (size_t a, size_t b)
848 struct stack_var *vb = &stack_vars[b];
849 bitmap_iterator bi;
850 unsigned u;
852 gcc_assert (stack_vars[b].next == EOC);
853 /* Add B to A's partition. */
854 stack_vars[b].next = stack_vars[a].next;
855 stack_vars[b].representative = a;
856 stack_vars[a].next = b;
858 /* Update the required alignment of partition A to account for B. */
859 if (stack_vars[a].alignb < stack_vars[b].alignb)
860 stack_vars[a].alignb = stack_vars[b].alignb;
862 /* Update the interference graph and merge the conflicts. */
863 if (vb->conflicts)
865 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
866 add_stack_var_conflict (a, stack_vars[u].representative);
867 BITMAP_FREE (vb->conflicts);
871 /* A subroutine of expand_used_vars. Binpack the variables into
872 partitions constrained by the interference graph. The overall
873 algorithm used is as follows:
875 Sort the objects by size in descending order.
876 For each object A {
877 S = size(A)
878 O = 0
879 loop {
880 Look for the largest non-conflicting object B with size <= S.
881 UNION (A, B)
886 static void
887 partition_stack_vars (void)
889 size_t si, sj, n = stack_vars_num;
891 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
892 for (si = 0; si < n; ++si)
893 stack_vars_sorted[si] = si;
895 if (n == 1)
896 return;
898 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
900 for (si = 0; si < n; ++si)
902 size_t i = stack_vars_sorted[si];
903 unsigned int ialign = stack_vars[i].alignb;
904 poly_int64 isize = stack_vars[i].size;
906 /* Ignore objects that aren't partition representatives. If we
907 see a var that is not a partition representative, it must
908 have been merged earlier. */
909 if (stack_vars[i].representative != i)
910 continue;
912 for (sj = si + 1; sj < n; ++sj)
914 size_t j = stack_vars_sorted[sj];
915 unsigned int jalign = stack_vars[j].alignb;
916 poly_int64 jsize = stack_vars[j].size;
918 /* Ignore objects that aren't partition representatives. */
919 if (stack_vars[j].representative != j)
920 continue;
922 /* Do not mix objects of "small" (supported) alignment
923 and "large" (unsupported) alignment. */
924 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
925 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
926 break;
928 /* For Address Sanitizer do not mix objects with different
929 sizes, as the shorter vars wouldn't be adequately protected.
930 Don't do that for "large" (unsupported) alignment objects,
931 those aren't protected anyway. */
932 if (asan_sanitize_stack_p ()
933 && maybe_ne (isize, jsize)
934 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
935 break;
937 /* Ignore conflicting objects. */
938 if (stack_var_conflict_p (i, j))
939 continue;
941 /* UNION the objects, placing J at OFFSET. */
942 union_stack_vars (i, j);
946 update_alias_info_with_stack_vars ();
949 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
951 static void
952 dump_stack_var_partition (void)
954 size_t si, i, j, n = stack_vars_num;
956 for (si = 0; si < n; ++si)
958 i = stack_vars_sorted[si];
960 /* Skip variables that aren't partition representatives, for now. */
961 if (stack_vars[i].representative != i)
962 continue;
964 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
965 print_dec (stack_vars[i].size, dump_file);
966 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
968 for (j = i; j != EOC; j = stack_vars[j].next)
970 fputc ('\t', dump_file);
971 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
973 fputc ('\n', dump_file);
977 /* Assign rtl to DECL at BASE + OFFSET. */
979 static void
980 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
981 poly_int64 offset)
983 unsigned align;
984 rtx x;
986 /* If this fails, we've overflowed the stack frame. Error nicely? */
987 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
989 x = plus_constant (Pmode, base, offset);
990 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
991 ? TYPE_MODE (TREE_TYPE (decl))
992 : DECL_MODE (SSAVAR (decl)), x);
994 if (TREE_CODE (decl) != SSA_NAME)
996 /* Set alignment we actually gave this decl if it isn't an SSA name.
997 If it is we generate stack slots only accidentally so it isn't as
998 important, we'll simply use the alignment that is already set. */
999 if (base == virtual_stack_vars_rtx)
1000 offset -= frame_phase;
1001 align = known_alignment (offset);
1002 align *= BITS_PER_UNIT;
1003 if (align == 0 || align > base_align)
1004 align = base_align;
1006 /* One would think that we could assert that we're not decreasing
1007 alignment here, but (at least) the i386 port does exactly this
1008 via the MINIMUM_ALIGNMENT hook. */
1010 SET_DECL_ALIGN (decl, align);
1011 DECL_USER_ALIGN (decl) = 0;
1014 set_rtl (decl, x);
1017 struct stack_vars_data
1019 /* Vector of offset pairs, always end of some padding followed
1020 by start of the padding that needs Address Sanitizer protection.
1021 The vector is in reversed, highest offset pairs come first. */
1022 auto_vec<HOST_WIDE_INT> asan_vec;
1024 /* Vector of partition representative decls in between the paddings. */
1025 auto_vec<tree> asan_decl_vec;
1027 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1028 rtx asan_base;
1030 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1031 unsigned int asan_alignb;
1034 /* A subroutine of expand_used_vars. Give each partition representative
1035 a unique location within the stack frame. Update each partition member
1036 with that location. */
1038 static void
1039 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1041 size_t si, i, j, n = stack_vars_num;
1042 poly_uint64 large_size = 0, large_alloc = 0;
1043 rtx large_base = NULL;
1044 unsigned large_align = 0;
1045 bool large_allocation_done = false;
1046 tree decl;
1048 /* Determine if there are any variables requiring "large" alignment.
1049 Since these are dynamically allocated, we only process these if
1050 no predicate involved. */
1051 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1052 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1054 /* Find the total size of these variables. */
1055 for (si = 0; si < n; ++si)
1057 unsigned alignb;
1059 i = stack_vars_sorted[si];
1060 alignb = stack_vars[i].alignb;
1062 /* All "large" alignment decls come before all "small" alignment
1063 decls, but "large" alignment decls are not sorted based on
1064 their alignment. Increase large_align to track the largest
1065 required alignment. */
1066 if ((alignb * BITS_PER_UNIT) > large_align)
1067 large_align = alignb * BITS_PER_UNIT;
1069 /* Stop when we get to the first decl with "small" alignment. */
1070 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1071 break;
1073 /* Skip variables that aren't partition representatives. */
1074 if (stack_vars[i].representative != i)
1075 continue;
1077 /* Skip variables that have already had rtl assigned. See also
1078 add_stack_var where we perpetrate this pc_rtx hack. */
1079 decl = stack_vars[i].decl;
1080 if (TREE_CODE (decl) == SSA_NAME
1081 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1082 : DECL_RTL (decl) != pc_rtx)
1083 continue;
1085 large_size = aligned_upper_bound (large_size, alignb);
1086 large_size += stack_vars[i].size;
1090 for (si = 0; si < n; ++si)
1092 rtx base;
1093 unsigned base_align, alignb;
1094 poly_int64 offset;
1096 i = stack_vars_sorted[si];
1098 /* Skip variables that aren't partition representatives, for now. */
1099 if (stack_vars[i].representative != i)
1100 continue;
1102 /* Skip variables that have already had rtl assigned. See also
1103 add_stack_var where we perpetrate this pc_rtx hack. */
1104 decl = stack_vars[i].decl;
1105 if (TREE_CODE (decl) == SSA_NAME
1106 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1107 : DECL_RTL (decl) != pc_rtx)
1108 continue;
1110 /* Check the predicate to see whether this variable should be
1111 allocated in this pass. */
1112 if (pred && !pred (i))
1113 continue;
1115 alignb = stack_vars[i].alignb;
1116 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1118 base = virtual_stack_vars_rtx;
1119 /* ASAN description strings don't yet have a syntax for expressing
1120 polynomial offsets. */
1121 HOST_WIDE_INT prev_offset;
1122 if (asan_sanitize_stack_p ()
1123 && pred
1124 && frame_offset.is_constant (&prev_offset)
1125 && stack_vars[i].size.is_constant ())
1127 prev_offset = align_base (prev_offset,
1128 MAX (alignb, ASAN_RED_ZONE_SIZE),
1129 !FRAME_GROWS_DOWNWARD);
1130 tree repr_decl = NULL_TREE;
1131 offset
1132 = alloc_stack_frame_space (stack_vars[i].size
1133 + ASAN_RED_ZONE_SIZE,
1134 MAX (alignb, ASAN_RED_ZONE_SIZE));
1136 data->asan_vec.safe_push (prev_offset);
1137 /* Allocating a constant amount of space from a constant
1138 starting offset must give a constant result. */
1139 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1140 .to_constant ());
1141 /* Find best representative of the partition.
1142 Prefer those with DECL_NAME, even better
1143 satisfying asan_protect_stack_decl predicate. */
1144 for (j = i; j != EOC; j = stack_vars[j].next)
1145 if (asan_protect_stack_decl (stack_vars[j].decl)
1146 && DECL_NAME (stack_vars[j].decl))
1148 repr_decl = stack_vars[j].decl;
1149 break;
1151 else if (repr_decl == NULL_TREE
1152 && DECL_P (stack_vars[j].decl)
1153 && DECL_NAME (stack_vars[j].decl))
1154 repr_decl = stack_vars[j].decl;
1155 if (repr_decl == NULL_TREE)
1156 repr_decl = stack_vars[i].decl;
1157 data->asan_decl_vec.safe_push (repr_decl);
1158 data->asan_alignb = MAX (data->asan_alignb, alignb);
1159 if (data->asan_base == NULL)
1160 data->asan_base = gen_reg_rtx (Pmode);
1161 base = data->asan_base;
1163 if (!STRICT_ALIGNMENT)
1164 base_align = crtl->max_used_stack_slot_alignment;
1165 else
1166 base_align = MAX (crtl->max_used_stack_slot_alignment,
1167 GET_MODE_ALIGNMENT (SImode)
1168 << ASAN_SHADOW_SHIFT);
1170 else
1172 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1173 base_align = crtl->max_used_stack_slot_alignment;
1176 else
1178 /* Large alignment is only processed in the last pass. */
1179 if (pred)
1180 continue;
1182 /* If there were any variables requiring "large" alignment, allocate
1183 space. */
1184 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1186 poly_int64 loffset;
1187 rtx large_allocsize;
1189 large_allocsize = gen_int_mode (large_size, Pmode);
1190 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1191 loffset = alloc_stack_frame_space
1192 (rtx_to_poly_int64 (large_allocsize),
1193 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1194 large_base = get_dynamic_stack_base (loffset, large_align);
1195 large_allocation_done = true;
1197 gcc_assert (large_base != NULL);
1199 large_alloc = aligned_upper_bound (large_alloc, alignb);
1200 offset = large_alloc;
1201 large_alloc += stack_vars[i].size;
1203 base = large_base;
1204 base_align = large_align;
1207 /* Create rtl for each variable based on their location within the
1208 partition. */
1209 for (j = i; j != EOC; j = stack_vars[j].next)
1211 expand_one_stack_var_at (stack_vars[j].decl,
1212 base, base_align,
1213 offset);
1217 gcc_assert (known_eq (large_alloc, large_size));
1220 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1221 static poly_uint64
1222 account_stack_vars (void)
1224 size_t si, j, i, n = stack_vars_num;
1225 poly_uint64 size = 0;
1227 for (si = 0; si < n; ++si)
1229 i = stack_vars_sorted[si];
1231 /* Skip variables that aren't partition representatives, for now. */
1232 if (stack_vars[i].representative != i)
1233 continue;
1235 size += stack_vars[i].size;
1236 for (j = i; j != EOC; j = stack_vars[j].next)
1237 set_rtl (stack_vars[j].decl, NULL);
1239 return size;
1242 /* Record the RTL assignment X for the default def of PARM. */
1244 extern void
1245 set_parm_rtl (tree parm, rtx x)
1247 gcc_assert (TREE_CODE (parm) == PARM_DECL
1248 || TREE_CODE (parm) == RESULT_DECL);
1250 if (x && !MEM_P (x))
1252 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1253 TYPE_MODE (TREE_TYPE (parm)),
1254 TYPE_ALIGN (TREE_TYPE (parm)));
1256 /* If the variable alignment is very large we'll dynamicaly
1257 allocate it, which means that in-frame portion is just a
1258 pointer. ??? We've got a pseudo for sure here, do we
1259 actually dynamically allocate its spilling area if needed?
1260 ??? Isn't it a problem when Pmode alignment also exceeds
1261 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1262 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1263 align = GET_MODE_ALIGNMENT (Pmode);
1265 record_alignment_for_reg_var (align);
1268 tree ssa = ssa_default_def (cfun, parm);
1269 if (!ssa)
1270 return set_rtl (parm, x);
1272 int part = var_to_partition (SA.map, ssa);
1273 gcc_assert (part != NO_PARTITION);
1275 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1276 gcc_assert (changed);
1278 set_rtl (ssa, x);
1279 gcc_assert (DECL_RTL (parm) == x);
1282 /* A subroutine of expand_one_var. Called to immediately assign rtl
1283 to a variable to be allocated in the stack frame. */
1285 static void
1286 expand_one_stack_var_1 (tree var)
1288 poly_uint64 size;
1289 poly_int64 offset;
1290 unsigned byte_align;
1292 if (TREE_CODE (var) == SSA_NAME)
1294 tree type = TREE_TYPE (var);
1295 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1296 byte_align = TYPE_ALIGN_UNIT (type);
1298 else
1300 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1301 byte_align = align_local_variable (var);
1304 /* We handle highly aligned variables in expand_stack_vars. */
1305 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1307 offset = alloc_stack_frame_space (size, byte_align);
1309 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1310 crtl->max_used_stack_slot_alignment, offset);
1313 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1314 already assigned some MEM. */
1316 static void
1317 expand_one_stack_var (tree var)
1319 if (TREE_CODE (var) == SSA_NAME)
1321 int part = var_to_partition (SA.map, var);
1322 if (part != NO_PARTITION)
1324 rtx x = SA.partition_to_pseudo[part];
1325 gcc_assert (x);
1326 gcc_assert (MEM_P (x));
1327 return;
1331 return expand_one_stack_var_1 (var);
1334 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1335 that will reside in a hard register. */
1337 static void
1338 expand_one_hard_reg_var (tree var)
1340 rest_of_decl_compilation (var, 0, 0);
1343 /* Record the alignment requirements of some variable assigned to a
1344 pseudo. */
1346 static void
1347 record_alignment_for_reg_var (unsigned int align)
1349 if (SUPPORTS_STACK_ALIGNMENT
1350 && crtl->stack_alignment_estimated < align)
1352 /* stack_alignment_estimated shouldn't change after stack
1353 realign decision made */
1354 gcc_assert (!crtl->stack_realign_processed);
1355 crtl->stack_alignment_estimated = align;
1358 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1359 So here we only make sure stack_alignment_needed >= align. */
1360 if (crtl->stack_alignment_needed < align)
1361 crtl->stack_alignment_needed = align;
1362 if (crtl->max_used_stack_slot_alignment < align)
1363 crtl->max_used_stack_slot_alignment = align;
1366 /* Create RTL for an SSA partition. */
1368 static void
1369 expand_one_ssa_partition (tree var)
1371 int part = var_to_partition (SA.map, var);
1372 gcc_assert (part != NO_PARTITION);
1374 if (SA.partition_to_pseudo[part])
1375 return;
1377 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1378 TYPE_MODE (TREE_TYPE (var)),
1379 TYPE_ALIGN (TREE_TYPE (var)));
1381 /* If the variable alignment is very large we'll dynamicaly allocate
1382 it, which means that in-frame portion is just a pointer. */
1383 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1384 align = GET_MODE_ALIGNMENT (Pmode);
1386 record_alignment_for_reg_var (align);
1388 if (!use_register_for_decl (var))
1390 if (defer_stack_allocation (var, true))
1391 add_stack_var (var);
1392 else
1393 expand_one_stack_var_1 (var);
1394 return;
1397 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1398 rtx x = gen_reg_rtx (reg_mode);
1400 set_rtl (var, x);
1402 /* For a promoted variable, X will not be used directly but wrapped in a
1403 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1404 will assume that its upper bits can be inferred from its lower bits.
1405 Therefore, if X isn't initialized on every path from the entry, then
1406 we must do it manually in order to fulfill the above assumption. */
1407 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1408 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1409 emit_move_insn (x, CONST0_RTX (reg_mode));
1412 /* Record the association between the RTL generated for partition PART
1413 and the underlying variable of the SSA_NAME VAR. */
1415 static void
1416 adjust_one_expanded_partition_var (tree var)
1418 if (!var)
1419 return;
1421 tree decl = SSA_NAME_VAR (var);
1423 int part = var_to_partition (SA.map, var);
1424 if (part == NO_PARTITION)
1425 return;
1427 rtx x = SA.partition_to_pseudo[part];
1429 gcc_assert (x);
1431 set_rtl (var, x);
1433 if (!REG_P (x))
1434 return;
1436 /* Note if the object is a user variable. */
1437 if (decl && !DECL_ARTIFICIAL (decl))
1438 mark_user_reg (x);
1440 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1441 mark_reg_pointer (x, get_pointer_alignment (var));
1444 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1445 that will reside in a pseudo register. */
1447 static void
1448 expand_one_register_var (tree var)
1450 if (TREE_CODE (var) == SSA_NAME)
1452 int part = var_to_partition (SA.map, var);
1453 if (part != NO_PARTITION)
1455 rtx x = SA.partition_to_pseudo[part];
1456 gcc_assert (x);
1457 gcc_assert (REG_P (x));
1458 return;
1460 gcc_unreachable ();
1463 tree decl = var;
1464 tree type = TREE_TYPE (decl);
1465 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1466 rtx x = gen_reg_rtx (reg_mode);
1468 set_rtl (var, x);
1470 /* Note if the object is a user variable. */
1471 if (!DECL_ARTIFICIAL (decl))
1472 mark_user_reg (x);
1474 if (POINTER_TYPE_P (type))
1475 mark_reg_pointer (x, get_pointer_alignment (var));
1478 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1479 has some associated error, e.g. its type is error-mark. We just need
1480 to pick something that won't crash the rest of the compiler. */
1482 static void
1483 expand_one_error_var (tree var)
1485 machine_mode mode = DECL_MODE (var);
1486 rtx x;
1488 if (mode == BLKmode)
1489 x = gen_rtx_MEM (BLKmode, const0_rtx);
1490 else if (mode == VOIDmode)
1491 x = const0_rtx;
1492 else
1493 x = gen_reg_rtx (mode);
1495 SET_DECL_RTL (var, x);
1498 /* A subroutine of expand_one_var. VAR is a variable that will be
1499 allocated to the local stack frame. Return true if we wish to
1500 add VAR to STACK_VARS so that it will be coalesced with other
1501 variables. Return false to allocate VAR immediately.
1503 This function is used to reduce the number of variables considered
1504 for coalescing, which reduces the size of the quadratic problem. */
1506 static bool
1507 defer_stack_allocation (tree var, bool toplevel)
1509 tree size_unit = TREE_CODE (var) == SSA_NAME
1510 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1511 : DECL_SIZE_UNIT (var);
1512 poly_uint64 size;
1514 /* Whether the variable is small enough for immediate allocation not to be
1515 a problem with regard to the frame size. */
1516 bool smallish
1517 = (poly_int_tree_p (size_unit, &size)
1518 && (estimated_poly_value (size)
1519 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING)));
1521 /* If stack protection is enabled, *all* stack variables must be deferred,
1522 so that we can re-order the strings to the top of the frame.
1523 Similarly for Address Sanitizer. */
1524 if (flag_stack_protect || asan_sanitize_stack_p ())
1525 return true;
1527 unsigned int align = TREE_CODE (var) == SSA_NAME
1528 ? TYPE_ALIGN (TREE_TYPE (var))
1529 : DECL_ALIGN (var);
1531 /* We handle "large" alignment via dynamic allocation. We want to handle
1532 this extra complication in only one place, so defer them. */
1533 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1534 return true;
1536 bool ignored = TREE_CODE (var) == SSA_NAME
1537 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1538 : DECL_IGNORED_P (var);
1540 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1541 might be detached from their block and appear at toplevel when we reach
1542 here. We want to coalesce them with variables from other blocks when
1543 the immediate contribution to the frame size would be noticeable. */
1544 if (toplevel && optimize > 0 && ignored && !smallish)
1545 return true;
1547 /* Variables declared in the outermost scope automatically conflict
1548 with every other variable. The only reason to want to defer them
1549 at all is that, after sorting, we can more efficiently pack
1550 small variables in the stack frame. Continue to defer at -O2. */
1551 if (toplevel && optimize < 2)
1552 return false;
1554 /* Without optimization, *most* variables are allocated from the
1555 stack, which makes the quadratic problem large exactly when we
1556 want compilation to proceed as quickly as possible. On the
1557 other hand, we don't want the function's stack frame size to
1558 get completely out of hand. So we avoid adding scalars and
1559 "small" aggregates to the list at all. */
1560 if (optimize == 0 && smallish)
1561 return false;
1563 return true;
1566 /* A subroutine of expand_used_vars. Expand one variable according to
1567 its flavor. Variables to be placed on the stack are not actually
1568 expanded yet, merely recorded.
1569 When REALLY_EXPAND is false, only add stack values to be allocated.
1570 Return stack usage this variable is supposed to take.
1573 static poly_uint64
1574 expand_one_var (tree var, bool toplevel, bool really_expand)
1576 unsigned int align = BITS_PER_UNIT;
1577 tree origvar = var;
1579 var = SSAVAR (var);
1581 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1583 if (is_global_var (var))
1584 return 0;
1586 /* Because we don't know if VAR will be in register or on stack,
1587 we conservatively assume it will be on stack even if VAR is
1588 eventually put into register after RA pass. For non-automatic
1589 variables, which won't be on stack, we collect alignment of
1590 type and ignore user specified alignment. Similarly for
1591 SSA_NAMEs for which use_register_for_decl returns true. */
1592 if (TREE_STATIC (var)
1593 || DECL_EXTERNAL (var)
1594 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1595 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1596 TYPE_MODE (TREE_TYPE (var)),
1597 TYPE_ALIGN (TREE_TYPE (var)));
1598 else if (DECL_HAS_VALUE_EXPR_P (var)
1599 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1600 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1601 or variables which were assigned a stack slot already by
1602 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1603 changed from the offset chosen to it. */
1604 align = crtl->stack_alignment_estimated;
1605 else
1606 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1608 /* If the variable alignment is very large we'll dynamicaly allocate
1609 it, which means that in-frame portion is just a pointer. */
1610 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1611 align = GET_MODE_ALIGNMENT (Pmode);
1614 record_alignment_for_reg_var (align);
1616 poly_uint64 size;
1617 if (TREE_CODE (origvar) == SSA_NAME)
1619 gcc_assert (!VAR_P (var)
1620 || (!DECL_EXTERNAL (var)
1621 && !DECL_HAS_VALUE_EXPR_P (var)
1622 && !TREE_STATIC (var)
1623 && TREE_TYPE (var) != error_mark_node
1624 && !DECL_HARD_REGISTER (var)
1625 && really_expand));
1627 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1629 else if (DECL_EXTERNAL (var))
1631 else if (DECL_HAS_VALUE_EXPR_P (var))
1633 else if (TREE_STATIC (var))
1635 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1637 else if (TREE_TYPE (var) == error_mark_node)
1639 if (really_expand)
1640 expand_one_error_var (var);
1642 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1644 if (really_expand)
1646 expand_one_hard_reg_var (var);
1647 if (!DECL_HARD_REGISTER (var))
1648 /* Invalid register specification. */
1649 expand_one_error_var (var);
1652 else if (use_register_for_decl (var))
1654 if (really_expand)
1655 expand_one_register_var (origvar);
1657 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1658 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1660 /* Reject variables which cover more than half of the address-space. */
1661 if (really_expand)
1663 error ("size of variable %q+D is too large", var);
1664 expand_one_error_var (var);
1667 else if (defer_stack_allocation (var, toplevel))
1668 add_stack_var (origvar);
1669 else
1671 if (really_expand)
1673 if (lookup_attribute ("naked",
1674 DECL_ATTRIBUTES (current_function_decl)))
1675 error ("cannot allocate stack for variable %q+D, naked function.",
1676 var);
1678 expand_one_stack_var (origvar);
1680 return size;
1682 return 0;
1685 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1686 expanding variables. Those variables that can be put into registers
1687 are allocated pseudos; those that can't are put on the stack.
1689 TOPLEVEL is true if this is the outermost BLOCK. */
1691 static void
1692 expand_used_vars_for_block (tree block, bool toplevel)
1694 tree t;
1696 /* Expand all variables at this level. */
1697 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1698 if (TREE_USED (t)
1699 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1700 || !DECL_NONSHAREABLE (t)))
1701 expand_one_var (t, toplevel, true);
1703 /* Expand all variables at containing levels. */
1704 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1705 expand_used_vars_for_block (t, false);
1708 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1709 and clear TREE_USED on all local variables. */
1711 static void
1712 clear_tree_used (tree block)
1714 tree t;
1716 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1717 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1718 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1719 || !DECL_NONSHAREABLE (t))
1720 TREE_USED (t) = 0;
1722 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1723 clear_tree_used (t);
1726 enum {
1727 SPCT_FLAG_DEFAULT = 1,
1728 SPCT_FLAG_ALL = 2,
1729 SPCT_FLAG_STRONG = 3,
1730 SPCT_FLAG_EXPLICIT = 4
1733 /* Examine TYPE and determine a bit mask of the following features. */
1735 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1736 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1737 #define SPCT_HAS_ARRAY 4
1738 #define SPCT_HAS_AGGREGATE 8
1740 static unsigned int
1741 stack_protect_classify_type (tree type)
1743 unsigned int ret = 0;
1744 tree t;
1746 switch (TREE_CODE (type))
1748 case ARRAY_TYPE:
1749 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1750 if (t == char_type_node
1751 || t == signed_char_type_node
1752 || t == unsigned_char_type_node)
1754 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1755 unsigned HOST_WIDE_INT len;
1757 if (!TYPE_SIZE_UNIT (type)
1758 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1759 len = max;
1760 else
1761 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1763 if (len < max)
1764 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1765 else
1766 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1768 else
1769 ret = SPCT_HAS_ARRAY;
1770 break;
1772 case UNION_TYPE:
1773 case QUAL_UNION_TYPE:
1774 case RECORD_TYPE:
1775 ret = SPCT_HAS_AGGREGATE;
1776 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1777 if (TREE_CODE (t) == FIELD_DECL)
1778 ret |= stack_protect_classify_type (TREE_TYPE (t));
1779 break;
1781 default:
1782 break;
1785 return ret;
1788 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1789 part of the local stack frame. Remember if we ever return nonzero for
1790 any variable in this function. The return value is the phase number in
1791 which the variable should be allocated. */
1793 static int
1794 stack_protect_decl_phase (tree decl)
1796 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1797 int ret = 0;
1799 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1800 has_short_buffer = true;
1802 if (flag_stack_protect == SPCT_FLAG_ALL
1803 || flag_stack_protect == SPCT_FLAG_STRONG
1804 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1805 && lookup_attribute ("stack_protect",
1806 DECL_ATTRIBUTES (current_function_decl))))
1808 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1809 && !(bits & SPCT_HAS_AGGREGATE))
1810 ret = 1;
1811 else if (bits & SPCT_HAS_ARRAY)
1812 ret = 2;
1814 else
1815 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1817 if (ret)
1818 has_protected_decls = true;
1820 return ret;
1823 /* Two helper routines that check for phase 1 and phase 2. These are used
1824 as callbacks for expand_stack_vars. */
1826 static bool
1827 stack_protect_decl_phase_1 (size_t i)
1829 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1832 static bool
1833 stack_protect_decl_phase_2 (size_t i)
1835 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1838 /* And helper function that checks for asan phase (with stack protector
1839 it is phase 3). This is used as callback for expand_stack_vars.
1840 Returns true if any of the vars in the partition need to be protected. */
1842 static bool
1843 asan_decl_phase_3 (size_t i)
1845 while (i != EOC)
1847 if (asan_protect_stack_decl (stack_vars[i].decl))
1848 return true;
1849 i = stack_vars[i].next;
1851 return false;
1854 /* Ensure that variables in different stack protection phases conflict
1855 so that they are not merged and share the same stack slot. */
1857 static void
1858 add_stack_protection_conflicts (void)
1860 size_t i, j, n = stack_vars_num;
1861 unsigned char *phase;
1863 phase = XNEWVEC (unsigned char, n);
1864 for (i = 0; i < n; ++i)
1865 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1867 for (i = 0; i < n; ++i)
1869 unsigned char ph_i = phase[i];
1870 for (j = i + 1; j < n; ++j)
1871 if (ph_i != phase[j])
1872 add_stack_var_conflict (i, j);
1875 XDELETEVEC (phase);
1878 /* Create a decl for the guard at the top of the stack frame. */
1880 static void
1881 create_stack_guard (void)
1883 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1884 VAR_DECL, NULL, ptr_type_node);
1885 TREE_THIS_VOLATILE (guard) = 1;
1886 TREE_USED (guard) = 1;
1887 expand_one_stack_var (guard);
1888 crtl->stack_protect_guard = guard;
1891 /* Prepare for expanding variables. */
1892 static void
1893 init_vars_expansion (void)
1895 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1896 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1898 /* A map from decl to stack partition. */
1899 decl_to_stack_part = new hash_map<tree, size_t>;
1901 /* Initialize local stack smashing state. */
1902 has_protected_decls = false;
1903 has_short_buffer = false;
1906 /* Free up stack variable graph data. */
1907 static void
1908 fini_vars_expansion (void)
1910 bitmap_obstack_release (&stack_var_bitmap_obstack);
1911 if (stack_vars)
1912 XDELETEVEC (stack_vars);
1913 if (stack_vars_sorted)
1914 XDELETEVEC (stack_vars_sorted);
1915 stack_vars = NULL;
1916 stack_vars_sorted = NULL;
1917 stack_vars_alloc = stack_vars_num = 0;
1918 delete decl_to_stack_part;
1919 decl_to_stack_part = NULL;
1922 /* Make a fair guess for the size of the stack frame of the function
1923 in NODE. This doesn't have to be exact, the result is only used in
1924 the inline heuristics. So we don't want to run the full stack var
1925 packing algorithm (which is quadratic in the number of stack vars).
1926 Instead, we calculate the total size of all stack vars. This turns
1927 out to be a pretty fair estimate -- packing of stack vars doesn't
1928 happen very often. */
1930 HOST_WIDE_INT
1931 estimated_stack_frame_size (struct cgraph_node *node)
1933 poly_int64 size = 0;
1934 size_t i;
1935 tree var;
1936 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1938 push_cfun (fn);
1940 init_vars_expansion ();
1942 FOR_EACH_LOCAL_DECL (fn, i, var)
1943 if (auto_var_in_fn_p (var, fn->decl))
1944 size += expand_one_var (var, true, false);
1946 if (stack_vars_num > 0)
1948 /* Fake sorting the stack vars for account_stack_vars (). */
1949 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1950 for (i = 0; i < stack_vars_num; ++i)
1951 stack_vars_sorted[i] = i;
1952 size += account_stack_vars ();
1955 fini_vars_expansion ();
1956 pop_cfun ();
1957 return estimated_poly_value (size);
1960 /* Helper routine to check if a record or union contains an array field. */
1962 static int
1963 record_or_union_type_has_array_p (const_tree tree_type)
1965 tree fields = TYPE_FIELDS (tree_type);
1966 tree f;
1968 for (f = fields; f; f = DECL_CHAIN (f))
1969 if (TREE_CODE (f) == FIELD_DECL)
1971 tree field_type = TREE_TYPE (f);
1972 if (RECORD_OR_UNION_TYPE_P (field_type)
1973 && record_or_union_type_has_array_p (field_type))
1974 return 1;
1975 if (TREE_CODE (field_type) == ARRAY_TYPE)
1976 return 1;
1978 return 0;
1981 /* Check if the current function has local referenced variables that
1982 have their addresses taken, contain an array, or are arrays. */
1984 static bool
1985 stack_protect_decl_p ()
1987 unsigned i;
1988 tree var;
1990 FOR_EACH_LOCAL_DECL (cfun, i, var)
1991 if (!is_global_var (var))
1993 tree var_type = TREE_TYPE (var);
1994 if (VAR_P (var)
1995 && (TREE_CODE (var_type) == ARRAY_TYPE
1996 || TREE_ADDRESSABLE (var)
1997 || (RECORD_OR_UNION_TYPE_P (var_type)
1998 && record_or_union_type_has_array_p (var_type))))
1999 return true;
2001 return false;
2004 /* Check if the current function has calls that use a return slot. */
2006 static bool
2007 stack_protect_return_slot_p ()
2009 basic_block bb;
2011 FOR_ALL_BB_FN (bb, cfun)
2012 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2013 !gsi_end_p (gsi); gsi_next (&gsi))
2015 gimple *stmt = gsi_stmt (gsi);
2016 /* This assumes that calls to internal-only functions never
2017 use a return slot. */
2018 if (is_gimple_call (stmt)
2019 && !gimple_call_internal_p (stmt)
2020 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2021 gimple_call_fndecl (stmt)))
2022 return true;
2024 return false;
2027 /* Expand all variables used in the function. */
2029 static rtx_insn *
2030 expand_used_vars (void)
2032 tree var, outer_block = DECL_INITIAL (current_function_decl);
2033 auto_vec<tree> maybe_local_decls;
2034 rtx_insn *var_end_seq = NULL;
2035 unsigned i;
2036 unsigned len;
2037 bool gen_stack_protect_signal = false;
2039 /* Compute the phase of the stack frame for this function. */
2041 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2042 int off = targetm.starting_frame_offset () % align;
2043 frame_phase = off ? align - off : 0;
2046 /* Set TREE_USED on all variables in the local_decls. */
2047 FOR_EACH_LOCAL_DECL (cfun, i, var)
2048 TREE_USED (var) = 1;
2049 /* Clear TREE_USED on all variables associated with a block scope. */
2050 clear_tree_used (DECL_INITIAL (current_function_decl));
2052 init_vars_expansion ();
2054 if (targetm.use_pseudo_pic_reg ())
2055 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2057 for (i = 0; i < SA.map->num_partitions; i++)
2059 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2060 continue;
2062 tree var = partition_to_var (SA.map, i);
2064 gcc_assert (!virtual_operand_p (var));
2066 expand_one_ssa_partition (var);
2069 if (flag_stack_protect == SPCT_FLAG_STRONG)
2070 gen_stack_protect_signal
2071 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2073 /* At this point all variables on the local_decls with TREE_USED
2074 set are not associated with any block scope. Lay them out. */
2076 len = vec_safe_length (cfun->local_decls);
2077 FOR_EACH_LOCAL_DECL (cfun, i, var)
2079 bool expand_now = false;
2081 /* Expanded above already. */
2082 if (is_gimple_reg (var))
2084 TREE_USED (var) = 0;
2085 goto next;
2087 /* We didn't set a block for static or extern because it's hard
2088 to tell the difference between a global variable (re)declared
2089 in a local scope, and one that's really declared there to
2090 begin with. And it doesn't really matter much, since we're
2091 not giving them stack space. Expand them now. */
2092 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2093 expand_now = true;
2095 /* Expand variables not associated with any block now. Those created by
2096 the optimizers could be live anywhere in the function. Those that
2097 could possibly have been scoped originally and detached from their
2098 block will have their allocation deferred so we coalesce them with
2099 others when optimization is enabled. */
2100 else if (TREE_USED (var))
2101 expand_now = true;
2103 /* Finally, mark all variables on the list as used. We'll use
2104 this in a moment when we expand those associated with scopes. */
2105 TREE_USED (var) = 1;
2107 if (expand_now)
2108 expand_one_var (var, true, true);
2110 next:
2111 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2113 rtx rtl = DECL_RTL_IF_SET (var);
2115 /* Keep artificial non-ignored vars in cfun->local_decls
2116 chain until instantiate_decls. */
2117 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2118 add_local_decl (cfun, var);
2119 else if (rtl == NULL_RTX)
2120 /* If rtl isn't set yet, which can happen e.g. with
2121 -fstack-protector, retry before returning from this
2122 function. */
2123 maybe_local_decls.safe_push (var);
2127 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2129 +-----------------+-----------------+
2130 | ...processed... | ...duplicates...|
2131 +-----------------+-----------------+
2133 +-- LEN points here.
2135 We just want the duplicates, as those are the artificial
2136 non-ignored vars that we want to keep until instantiate_decls.
2137 Move them down and truncate the array. */
2138 if (!vec_safe_is_empty (cfun->local_decls))
2139 cfun->local_decls->block_remove (0, len);
2141 /* At this point, all variables within the block tree with TREE_USED
2142 set are actually used by the optimized function. Lay them out. */
2143 expand_used_vars_for_block (outer_block, true);
2145 if (stack_vars_num > 0)
2147 add_scope_conflicts ();
2149 /* If stack protection is enabled, we don't share space between
2150 vulnerable data and non-vulnerable data. */
2151 if (flag_stack_protect != 0
2152 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2153 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2154 && lookup_attribute ("stack_protect",
2155 DECL_ATTRIBUTES (current_function_decl)))))
2156 add_stack_protection_conflicts ();
2158 /* Now that we have collected all stack variables, and have computed a
2159 minimal interference graph, attempt to save some stack space. */
2160 partition_stack_vars ();
2161 if (dump_file)
2162 dump_stack_var_partition ();
2165 switch (flag_stack_protect)
2167 case SPCT_FLAG_ALL:
2168 create_stack_guard ();
2169 break;
2171 case SPCT_FLAG_STRONG:
2172 if (gen_stack_protect_signal
2173 || cfun->calls_alloca || has_protected_decls
2174 || lookup_attribute ("stack_protect",
2175 DECL_ATTRIBUTES (current_function_decl)))
2176 create_stack_guard ();
2177 break;
2179 case SPCT_FLAG_DEFAULT:
2180 if (cfun->calls_alloca || has_protected_decls
2181 || lookup_attribute ("stack_protect",
2182 DECL_ATTRIBUTES (current_function_decl)))
2183 create_stack_guard ();
2184 break;
2186 case SPCT_FLAG_EXPLICIT:
2187 if (lookup_attribute ("stack_protect",
2188 DECL_ATTRIBUTES (current_function_decl)))
2189 create_stack_guard ();
2190 break;
2191 default:
2195 /* Assign rtl to each variable based on these partitions. */
2196 if (stack_vars_num > 0)
2198 struct stack_vars_data data;
2200 data.asan_base = NULL_RTX;
2201 data.asan_alignb = 0;
2203 /* Reorder decls to be protected by iterating over the variables
2204 array multiple times, and allocating out of each phase in turn. */
2205 /* ??? We could probably integrate this into the qsort we did
2206 earlier, such that we naturally see these variables first,
2207 and thus naturally allocate things in the right order. */
2208 if (has_protected_decls)
2210 /* Phase 1 contains only character arrays. */
2211 expand_stack_vars (stack_protect_decl_phase_1, &data);
2213 /* Phase 2 contains other kinds of arrays. */
2214 if (flag_stack_protect == SPCT_FLAG_ALL
2215 || flag_stack_protect == SPCT_FLAG_STRONG
2216 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2217 && lookup_attribute ("stack_protect",
2218 DECL_ATTRIBUTES (current_function_decl))))
2219 expand_stack_vars (stack_protect_decl_phase_2, &data);
2222 if (asan_sanitize_stack_p ())
2223 /* Phase 3, any partitions that need asan protection
2224 in addition to phase 1 and 2. */
2225 expand_stack_vars (asan_decl_phase_3, &data);
2227 /* ASAN description strings don't yet have a syntax for expressing
2228 polynomial offsets. */
2229 HOST_WIDE_INT prev_offset;
2230 if (!data.asan_vec.is_empty ()
2231 && frame_offset.is_constant (&prev_offset))
2233 HOST_WIDE_INT offset, sz, redzonesz;
2234 redzonesz = ASAN_RED_ZONE_SIZE;
2235 sz = data.asan_vec[0] - prev_offset;
2236 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2237 && data.asan_alignb <= 4096
2238 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2239 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2240 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2241 /* Allocating a constant amount of space from a constant
2242 starting offset must give a constant result. */
2243 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2244 .to_constant ());
2245 data.asan_vec.safe_push (prev_offset);
2246 data.asan_vec.safe_push (offset);
2247 /* Leave space for alignment if STRICT_ALIGNMENT. */
2248 if (STRICT_ALIGNMENT)
2249 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2250 << ASAN_SHADOW_SHIFT)
2251 / BITS_PER_UNIT, 1);
2253 var_end_seq
2254 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2255 data.asan_base,
2256 data.asan_alignb,
2257 data.asan_vec.address (),
2258 data.asan_decl_vec.address (),
2259 data.asan_vec.length ());
2262 expand_stack_vars (NULL, &data);
2265 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2266 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2267 virtual_stack_vars_rtx,
2268 var_end_seq);
2270 fini_vars_expansion ();
2272 /* If there were any artificial non-ignored vars without rtl
2273 found earlier, see if deferred stack allocation hasn't assigned
2274 rtl to them. */
2275 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2277 rtx rtl = DECL_RTL_IF_SET (var);
2279 /* Keep artificial non-ignored vars in cfun->local_decls
2280 chain until instantiate_decls. */
2281 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2282 add_local_decl (cfun, var);
2285 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2286 if (STACK_ALIGNMENT_NEEDED)
2288 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2289 if (FRAME_GROWS_DOWNWARD)
2290 frame_offset = aligned_lower_bound (frame_offset, align);
2291 else
2292 frame_offset = aligned_upper_bound (frame_offset, align);
2295 return var_end_seq;
2299 /* If we need to produce a detailed dump, print the tree representation
2300 for STMT to the dump file. SINCE is the last RTX after which the RTL
2301 generated for STMT should have been appended. */
2303 static void
2304 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2306 if (dump_file && (dump_flags & TDF_DETAILS))
2308 fprintf (dump_file, "\n;; ");
2309 print_gimple_stmt (dump_file, stmt, 0,
2310 TDF_SLIM | (dump_flags & TDF_LINENO));
2311 fprintf (dump_file, "\n");
2313 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2317 /* Maps the blocks that do not contain tree labels to rtx labels. */
2319 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2321 /* Returns the label_rtx expression for a label starting basic block BB. */
2323 static rtx_code_label *
2324 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2326 gimple_stmt_iterator gsi;
2327 tree lab;
2329 if (bb->flags & BB_RTL)
2330 return block_label (bb);
2332 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2333 if (elt)
2334 return *elt;
2336 /* Find the tree label if it is present. */
2338 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2340 glabel *lab_stmt;
2342 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2343 if (!lab_stmt)
2344 break;
2346 lab = gimple_label_label (lab_stmt);
2347 if (DECL_NONLOCAL (lab))
2348 break;
2350 return jump_target_rtx (lab);
2353 rtx_code_label *l = gen_label_rtx ();
2354 lab_rtx_for_bb->put (bb, l);
2355 return l;
2359 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2360 of a basic block where we just expanded the conditional at the end,
2361 possibly clean up the CFG and instruction sequence. LAST is the
2362 last instruction before the just emitted jump sequence. */
2364 static void
2365 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2367 /* Special case: when jumpif decides that the condition is
2368 trivial it emits an unconditional jump (and the necessary
2369 barrier). But we still have two edges, the fallthru one is
2370 wrong. purge_dead_edges would clean this up later. Unfortunately
2371 we have to insert insns (and split edges) before
2372 find_many_sub_basic_blocks and hence before purge_dead_edges.
2373 But splitting edges might create new blocks which depend on the
2374 fact that if there are two edges there's no barrier. So the
2375 barrier would get lost and verify_flow_info would ICE. Instead
2376 of auditing all edge splitters to care for the barrier (which
2377 normally isn't there in a cleaned CFG), fix it here. */
2378 if (BARRIER_P (get_last_insn ()))
2380 rtx_insn *insn;
2381 remove_edge (e);
2382 /* Now, we have a single successor block, if we have insns to
2383 insert on the remaining edge we potentially will insert
2384 it at the end of this block (if the dest block isn't feasible)
2385 in order to avoid splitting the edge. This insertion will take
2386 place in front of the last jump. But we might have emitted
2387 multiple jumps (conditional and one unconditional) to the
2388 same destination. Inserting in front of the last one then
2389 is a problem. See PR 40021. We fix this by deleting all
2390 jumps except the last unconditional one. */
2391 insn = PREV_INSN (get_last_insn ());
2392 /* Make sure we have an unconditional jump. Otherwise we're
2393 confused. */
2394 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2395 for (insn = PREV_INSN (insn); insn != last;)
2397 insn = PREV_INSN (insn);
2398 if (JUMP_P (NEXT_INSN (insn)))
2400 if (!any_condjump_p (NEXT_INSN (insn)))
2402 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2403 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2405 delete_insn (NEXT_INSN (insn));
2411 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2412 Returns a new basic block if we've terminated the current basic
2413 block and created a new one. */
2415 static basic_block
2416 expand_gimple_cond (basic_block bb, gcond *stmt)
2418 basic_block new_bb, dest;
2419 edge true_edge;
2420 edge false_edge;
2421 rtx_insn *last2, *last;
2422 enum tree_code code;
2423 tree op0, op1;
2425 code = gimple_cond_code (stmt);
2426 op0 = gimple_cond_lhs (stmt);
2427 op1 = gimple_cond_rhs (stmt);
2428 /* We're sometimes presented with such code:
2429 D.123_1 = x < y;
2430 if (D.123_1 != 0)
2432 This would expand to two comparisons which then later might
2433 be cleaned up by combine. But some pattern matchers like if-conversion
2434 work better when there's only one compare, so make up for this
2435 here as special exception if TER would have made the same change. */
2436 if (SA.values
2437 && TREE_CODE (op0) == SSA_NAME
2438 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2439 && TREE_CODE (op1) == INTEGER_CST
2440 && ((gimple_cond_code (stmt) == NE_EXPR
2441 && integer_zerop (op1))
2442 || (gimple_cond_code (stmt) == EQ_EXPR
2443 && integer_onep (op1)))
2444 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2446 gimple *second = SSA_NAME_DEF_STMT (op0);
2447 if (gimple_code (second) == GIMPLE_ASSIGN)
2449 enum tree_code code2 = gimple_assign_rhs_code (second);
2450 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2452 code = code2;
2453 op0 = gimple_assign_rhs1 (second);
2454 op1 = gimple_assign_rhs2 (second);
2456 /* If jumps are cheap and the target does not support conditional
2457 compare, turn some more codes into jumpy sequences. */
2458 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2459 && targetm.gen_ccmp_first == NULL)
2461 if ((code2 == BIT_AND_EXPR
2462 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2463 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2464 || code2 == TRUTH_AND_EXPR)
2466 code = TRUTH_ANDIF_EXPR;
2467 op0 = gimple_assign_rhs1 (second);
2468 op1 = gimple_assign_rhs2 (second);
2470 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2472 code = TRUTH_ORIF_EXPR;
2473 op0 = gimple_assign_rhs1 (second);
2474 op1 = gimple_assign_rhs2 (second);
2480 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2481 into (x - C2) * C3 < C4. */
2482 if ((code == EQ_EXPR || code == NE_EXPR)
2483 && TREE_CODE (op0) == SSA_NAME
2484 && TREE_CODE (op1) == INTEGER_CST)
2485 code = maybe_optimize_mod_cmp (code, &op0, &op1);
2487 last2 = last = get_last_insn ();
2489 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2490 set_curr_insn_location (gimple_location (stmt));
2492 /* These flags have no purpose in RTL land. */
2493 true_edge->flags &= ~EDGE_TRUE_VALUE;
2494 false_edge->flags &= ~EDGE_FALSE_VALUE;
2496 /* We can either have a pure conditional jump with one fallthru edge or
2497 two-way jump that needs to be decomposed into two basic blocks. */
2498 if (false_edge->dest == bb->next_bb)
2500 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2501 true_edge->probability);
2502 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2503 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2504 set_curr_insn_location (true_edge->goto_locus);
2505 false_edge->flags |= EDGE_FALLTHRU;
2506 maybe_cleanup_end_of_block (false_edge, last);
2507 return NULL;
2509 if (true_edge->dest == bb->next_bb)
2511 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2512 false_edge->probability);
2513 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2514 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2515 set_curr_insn_location (false_edge->goto_locus);
2516 true_edge->flags |= EDGE_FALLTHRU;
2517 maybe_cleanup_end_of_block (true_edge, last);
2518 return NULL;
2521 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2522 true_edge->probability);
2523 last = get_last_insn ();
2524 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2525 set_curr_insn_location (false_edge->goto_locus);
2526 emit_jump (label_rtx_for_bb (false_edge->dest));
2528 BB_END (bb) = last;
2529 if (BARRIER_P (BB_END (bb)))
2530 BB_END (bb) = PREV_INSN (BB_END (bb));
2531 update_bb_for_insn (bb);
2533 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2534 dest = false_edge->dest;
2535 redirect_edge_succ (false_edge, new_bb);
2536 false_edge->flags |= EDGE_FALLTHRU;
2537 new_bb->count = false_edge->count ();
2538 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2539 add_bb_to_loop (new_bb, loop);
2540 if (loop->latch == bb
2541 && loop->header == dest)
2542 loop->latch = new_bb;
2543 make_single_succ_edge (new_bb, dest, 0);
2544 if (BARRIER_P (BB_END (new_bb)))
2545 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2546 update_bb_for_insn (new_bb);
2548 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2550 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2552 set_curr_insn_location (true_edge->goto_locus);
2553 true_edge->goto_locus = curr_insn_location ();
2556 return new_bb;
2559 /* Mark all calls that can have a transaction restart. */
2561 static void
2562 mark_transaction_restart_calls (gimple *stmt)
2564 struct tm_restart_node dummy;
2565 tm_restart_node **slot;
2567 if (!cfun->gimple_df->tm_restart)
2568 return;
2570 dummy.stmt = stmt;
2571 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2572 if (slot)
2574 struct tm_restart_node *n = *slot;
2575 tree list = n->label_or_list;
2576 rtx_insn *insn;
2578 for (insn = next_real_insn (get_last_insn ());
2579 !CALL_P (insn);
2580 insn = next_real_insn (insn))
2581 continue;
2583 if (TREE_CODE (list) == LABEL_DECL)
2584 add_reg_note (insn, REG_TM, label_rtx (list));
2585 else
2586 for (; list ; list = TREE_CHAIN (list))
2587 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2591 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2592 statement STMT. */
2594 static void
2595 expand_call_stmt (gcall *stmt)
2597 tree exp, decl, lhs;
2598 bool builtin_p;
2599 size_t i;
2601 if (gimple_call_internal_p (stmt))
2603 expand_internal_call (stmt);
2604 return;
2607 /* If this is a call to a built-in function and it has no effect other
2608 than setting the lhs, try to implement it using an internal function
2609 instead. */
2610 decl = gimple_call_fndecl (stmt);
2611 if (gimple_call_lhs (stmt)
2612 && !gimple_has_side_effects (stmt)
2613 && (optimize || (decl && called_as_built_in (decl))))
2615 internal_fn ifn = replacement_internal_fn (stmt);
2616 if (ifn != IFN_LAST)
2618 expand_internal_call (ifn, stmt);
2619 return;
2623 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2625 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2626 builtin_p = decl && fndecl_built_in_p (decl);
2628 /* If this is not a builtin function, the function type through which the
2629 call is made may be different from the type of the function. */
2630 if (!builtin_p)
2631 CALL_EXPR_FN (exp)
2632 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2633 CALL_EXPR_FN (exp));
2635 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2636 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2638 for (i = 0; i < gimple_call_num_args (stmt); i++)
2640 tree arg = gimple_call_arg (stmt, i);
2641 gimple *def;
2642 /* TER addresses into arguments of builtin functions so we have a
2643 chance to infer more correct alignment information. See PR39954. */
2644 if (builtin_p
2645 && TREE_CODE (arg) == SSA_NAME
2646 && (def = get_gimple_for_ssa_name (arg))
2647 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2648 arg = gimple_assign_rhs1 (def);
2649 CALL_EXPR_ARG (exp, i) = arg;
2652 if (gimple_has_side_effects (stmt))
2653 TREE_SIDE_EFFECTS (exp) = 1;
2655 if (gimple_call_nothrow_p (stmt))
2656 TREE_NOTHROW (exp) = 1;
2658 if (gimple_no_warning_p (stmt))
2659 TREE_NO_WARNING (exp) = 1;
2661 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2662 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2663 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2664 if (decl
2665 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2666 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2667 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2668 else
2669 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2670 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2671 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2672 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2674 /* Ensure RTL is created for debug args. */
2675 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2677 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2678 unsigned int ix;
2679 tree dtemp;
2681 if (debug_args)
2682 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2684 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2685 expand_debug_expr (dtemp);
2689 rtx_insn *before_call = get_last_insn ();
2690 lhs = gimple_call_lhs (stmt);
2691 if (lhs)
2692 expand_assignment (lhs, exp, false);
2693 else
2694 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2696 /* If the gimple call is an indirect call and has 'nocf_check'
2697 attribute find a generated CALL insn to mark it as no
2698 control-flow verification is needed. */
2699 if (gimple_call_nocf_check_p (stmt)
2700 && !gimple_call_fndecl (stmt))
2702 rtx_insn *last = get_last_insn ();
2703 while (!CALL_P (last)
2704 && last != before_call)
2705 last = PREV_INSN (last);
2707 if (last != before_call)
2708 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2711 mark_transaction_restart_calls (stmt);
2715 /* Generate RTL for an asm statement (explicit assembler code).
2716 STRING is a STRING_CST node containing the assembler code text,
2717 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2718 insn is volatile; don't optimize it. */
2720 static void
2721 expand_asm_loc (tree string, int vol, location_t locus)
2723 rtx body;
2725 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2726 ggc_strdup (TREE_STRING_POINTER (string)),
2727 locus);
2729 MEM_VOLATILE_P (body) = vol;
2731 /* Non-empty basic ASM implicitly clobbers memory. */
2732 if (TREE_STRING_LENGTH (string) != 0)
2734 rtx asm_op, clob;
2735 unsigned i, nclobbers;
2736 auto_vec<rtx> input_rvec, output_rvec;
2737 auto_vec<const char *> constraints;
2738 auto_vec<rtx> clobber_rvec;
2739 HARD_REG_SET clobbered_regs;
2740 CLEAR_HARD_REG_SET (clobbered_regs);
2742 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2743 clobber_rvec.safe_push (clob);
2745 if (targetm.md_asm_adjust)
2746 targetm.md_asm_adjust (output_rvec, input_rvec,
2747 constraints, clobber_rvec,
2748 clobbered_regs);
2750 asm_op = body;
2751 nclobbers = clobber_rvec.length ();
2752 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2754 XVECEXP (body, 0, 0) = asm_op;
2755 for (i = 0; i < nclobbers; i++)
2756 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2759 emit_insn (body);
2762 /* Return the number of times character C occurs in string S. */
2763 static int
2764 n_occurrences (int c, const char *s)
2766 int n = 0;
2767 while (*s)
2768 n += (*s++ == c);
2769 return n;
2772 /* A subroutine of expand_asm_operands. Check that all operands have
2773 the same number of alternatives. Return true if so. */
2775 static bool
2776 check_operand_nalternatives (const vec<const char *> &constraints)
2778 unsigned len = constraints.length();
2779 if (len > 0)
2781 int nalternatives = n_occurrences (',', constraints[0]);
2783 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2785 error ("too many alternatives in %<asm%>");
2786 return false;
2789 for (unsigned i = 1; i < len; ++i)
2790 if (n_occurrences (',', constraints[i]) != nalternatives)
2792 error ("operand constraints for %<asm%> differ "
2793 "in number of alternatives");
2794 return false;
2797 return true;
2800 /* Check for overlap between registers marked in CLOBBERED_REGS and
2801 anything inappropriate in T. Emit error and return the register
2802 variable definition for error, NULL_TREE for ok. */
2804 static bool
2805 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2807 /* Conflicts between asm-declared register variables and the clobber
2808 list are not allowed. */
2809 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2811 if (overlap)
2813 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2814 DECL_NAME (overlap));
2816 /* Reset registerness to stop multiple errors emitted for a single
2817 variable. */
2818 DECL_REGISTER (overlap) = 0;
2819 return true;
2822 return false;
2825 /* Generate RTL for an asm statement with arguments.
2826 STRING is the instruction template.
2827 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2828 Each output or input has an expression in the TREE_VALUE and
2829 a tree list in TREE_PURPOSE which in turn contains a constraint
2830 name in TREE_VALUE (or NULL_TREE) and a constraint string
2831 in TREE_PURPOSE.
2832 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2833 that is clobbered by this insn.
2835 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2836 should be the fallthru basic block of the asm goto.
2838 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2839 Some elements of OUTPUTS may be replaced with trees representing temporary
2840 values. The caller should copy those temporary values to the originally
2841 specified lvalues.
2843 VOL nonzero means the insn is volatile; don't optimize it. */
2845 static void
2846 expand_asm_stmt (gasm *stmt)
2848 class save_input_location
2850 location_t old;
2852 public:
2853 explicit save_input_location(location_t where)
2855 old = input_location;
2856 input_location = where;
2859 ~save_input_location()
2861 input_location = old;
2865 location_t locus = gimple_location (stmt);
2867 if (gimple_asm_input_p (stmt))
2869 const char *s = gimple_asm_string (stmt);
2870 tree string = build_string (strlen (s), s);
2871 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2872 return;
2875 /* There are some legacy diagnostics in here, and also avoids a
2876 sixth parameger to targetm.md_asm_adjust. */
2877 save_input_location s_i_l(locus);
2879 unsigned noutputs = gimple_asm_noutputs (stmt);
2880 unsigned ninputs = gimple_asm_ninputs (stmt);
2881 unsigned nlabels = gimple_asm_nlabels (stmt);
2882 unsigned i;
2884 /* ??? Diagnose during gimplification? */
2885 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2887 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2888 return;
2891 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2892 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2893 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2895 /* Copy the gimple vectors into new vectors that we can manipulate. */
2897 output_tvec.safe_grow (noutputs);
2898 input_tvec.safe_grow (ninputs);
2899 constraints.safe_grow (noutputs + ninputs);
2901 for (i = 0; i < noutputs; ++i)
2903 tree t = gimple_asm_output_op (stmt, i);
2904 output_tvec[i] = TREE_VALUE (t);
2905 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2907 for (i = 0; i < ninputs; i++)
2909 tree t = gimple_asm_input_op (stmt, i);
2910 input_tvec[i] = TREE_VALUE (t);
2911 constraints[i + noutputs]
2912 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2915 /* ??? Diagnose during gimplification? */
2916 if (! check_operand_nalternatives (constraints))
2917 return;
2919 /* Count the number of meaningful clobbered registers, ignoring what
2920 we would ignore later. */
2921 auto_vec<rtx> clobber_rvec;
2922 HARD_REG_SET clobbered_regs;
2923 CLEAR_HARD_REG_SET (clobbered_regs);
2925 if (unsigned n = gimple_asm_nclobbers (stmt))
2927 clobber_rvec.reserve (n);
2928 for (i = 0; i < n; i++)
2930 tree t = gimple_asm_clobber_op (stmt, i);
2931 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2932 int nregs, j;
2934 j = decode_reg_name_and_count (regname, &nregs);
2935 if (j < 0)
2937 if (j == -2)
2939 /* ??? Diagnose during gimplification? */
2940 error ("unknown register name %qs in %<asm%>", regname);
2942 else if (j == -4)
2944 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2945 clobber_rvec.safe_push (x);
2947 else
2949 /* Otherwise we should have -1 == empty string
2950 or -3 == cc, which is not a register. */
2951 gcc_assert (j == -1 || j == -3);
2954 else
2955 for (int reg = j; reg < j + nregs; reg++)
2957 /* Clobbering the PIC register is an error. */
2958 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2960 /* ??? Diagnose during gimplification? */
2961 error ("PIC register clobbered by %qs in %<asm%>",
2962 regname);
2963 return;
2966 SET_HARD_REG_BIT (clobbered_regs, reg);
2967 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2968 clobber_rvec.safe_push (x);
2972 unsigned nclobbers = clobber_rvec.length();
2974 /* First pass over inputs and outputs checks validity and sets
2975 mark_addressable if needed. */
2976 /* ??? Diagnose during gimplification? */
2978 for (i = 0; i < noutputs; ++i)
2980 tree val = output_tvec[i];
2981 tree type = TREE_TYPE (val);
2982 const char *constraint;
2983 bool is_inout;
2984 bool allows_reg;
2985 bool allows_mem;
2987 /* Try to parse the output constraint. If that fails, there's
2988 no point in going further. */
2989 constraint = constraints[i];
2990 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
2991 &allows_mem, &allows_reg, &is_inout))
2992 return;
2994 if (! allows_reg
2995 && (allows_mem
2996 || is_inout
2997 || (DECL_P (val)
2998 && REG_P (DECL_RTL (val))
2999 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3000 mark_addressable (val);
3003 for (i = 0; i < ninputs; ++i)
3005 bool allows_reg, allows_mem;
3006 const char *constraint;
3008 constraint = constraints[i + noutputs];
3009 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3010 constraints.address (),
3011 &allows_mem, &allows_reg))
3012 return;
3014 if (! allows_reg && allows_mem)
3015 mark_addressable (input_tvec[i]);
3018 /* Second pass evaluates arguments. */
3020 /* Make sure stack is consistent for asm goto. */
3021 if (nlabels > 0)
3022 do_pending_stack_adjust ();
3023 int old_generating_concat_p = generating_concat_p;
3025 /* Vector of RTX's of evaluated output operands. */
3026 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3027 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3028 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3030 output_rvec.safe_grow (noutputs);
3032 for (i = 0; i < noutputs; ++i)
3034 tree val = output_tvec[i];
3035 tree type = TREE_TYPE (val);
3036 bool is_inout, allows_reg, allows_mem, ok;
3037 rtx op;
3039 ok = parse_output_constraint (&constraints[i], i, ninputs,
3040 noutputs, &allows_mem, &allows_reg,
3041 &is_inout);
3042 gcc_assert (ok);
3044 /* If an output operand is not a decl or indirect ref and our constraint
3045 allows a register, make a temporary to act as an intermediate.
3046 Make the asm insn write into that, then we will copy it to
3047 the real output operand. Likewise for promoted variables. */
3049 generating_concat_p = 0;
3051 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3052 || (DECL_P (val)
3053 && (allows_mem || REG_P (DECL_RTL (val)))
3054 && ! (REG_P (DECL_RTL (val))
3055 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3056 || ! allows_reg
3057 || is_inout
3058 || TREE_ADDRESSABLE (type))
3060 op = expand_expr (val, NULL_RTX, VOIDmode,
3061 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3062 if (MEM_P (op))
3063 op = validize_mem (op);
3065 if (! allows_reg && !MEM_P (op))
3066 error ("output number %d not directly addressable", i);
3067 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3068 || GET_CODE (op) == CONCAT)
3070 rtx old_op = op;
3071 op = gen_reg_rtx (GET_MODE (op));
3073 generating_concat_p = old_generating_concat_p;
3075 if (is_inout)
3076 emit_move_insn (op, old_op);
3078 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3079 emit_move_insn (old_op, op);
3080 after_rtl_seq = get_insns ();
3081 after_rtl_end = get_last_insn ();
3082 end_sequence ();
3085 else
3087 op = assign_temp (type, 0, 1);
3088 op = validize_mem (op);
3089 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3090 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3092 generating_concat_p = old_generating_concat_p;
3094 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3095 expand_assignment (val, make_tree (type, op), false);
3096 after_rtl_seq = get_insns ();
3097 after_rtl_end = get_last_insn ();
3098 end_sequence ();
3100 output_rvec[i] = op;
3102 if (is_inout)
3103 inout_opnum.safe_push (i);
3106 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3107 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3109 input_rvec.safe_grow (ninputs);
3110 input_mode.safe_grow (ninputs);
3112 generating_concat_p = 0;
3114 for (i = 0; i < ninputs; ++i)
3116 tree val = input_tvec[i];
3117 tree type = TREE_TYPE (val);
3118 bool allows_reg, allows_mem, ok;
3119 const char *constraint;
3120 rtx op;
3122 constraint = constraints[i + noutputs];
3123 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3124 constraints.address (),
3125 &allows_mem, &allows_reg);
3126 gcc_assert (ok);
3128 /* EXPAND_INITIALIZER will not generate code for valid initializer
3129 constants, but will still generate code for other types of operand.
3130 This is the behavior we want for constant constraints. */
3131 op = expand_expr (val, NULL_RTX, VOIDmode,
3132 allows_reg ? EXPAND_NORMAL
3133 : allows_mem ? EXPAND_MEMORY
3134 : EXPAND_INITIALIZER);
3136 /* Never pass a CONCAT to an ASM. */
3137 if (GET_CODE (op) == CONCAT)
3138 op = force_reg (GET_MODE (op), op);
3139 else if (MEM_P (op))
3140 op = validize_mem (op);
3142 if (asm_operand_ok (op, constraint, NULL) <= 0)
3144 if (allows_reg && TYPE_MODE (type) != BLKmode)
3145 op = force_reg (TYPE_MODE (type), op);
3146 else if (!allows_mem)
3147 warning (0, "asm operand %d probably doesn%'t match constraints",
3148 i + noutputs);
3149 else if (MEM_P (op))
3151 /* We won't recognize either volatile memory or memory
3152 with a queued address as available a memory_operand
3153 at this point. Ignore it: clearly this *is* a memory. */
3155 else
3156 gcc_unreachable ();
3158 input_rvec[i] = op;
3159 input_mode[i] = TYPE_MODE (type);
3162 /* For in-out operands, copy output rtx to input rtx. */
3163 unsigned ninout = inout_opnum.length();
3164 for (i = 0; i < ninout; i++)
3166 int j = inout_opnum[i];
3167 rtx o = output_rvec[j];
3169 input_rvec.safe_push (o);
3170 input_mode.safe_push (GET_MODE (o));
3172 char buffer[16];
3173 sprintf (buffer, "%d", j);
3174 constraints.safe_push (ggc_strdup (buffer));
3176 ninputs += ninout;
3178 /* Sometimes we wish to automatically clobber registers across an asm.
3179 Case in point is when the i386 backend moved from cc0 to a hard reg --
3180 maintaining source-level compatibility means automatically clobbering
3181 the flags register. */
3182 rtx_insn *after_md_seq = NULL;
3183 if (targetm.md_asm_adjust)
3184 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3185 constraints, clobber_rvec,
3186 clobbered_regs);
3188 /* Do not allow the hook to change the output and input count,
3189 lest it mess up the operand numbering. */
3190 gcc_assert (output_rvec.length() == noutputs);
3191 gcc_assert (input_rvec.length() == ninputs);
3192 gcc_assert (constraints.length() == noutputs + ninputs);
3194 /* But it certainly can adjust the clobbers. */
3195 nclobbers = clobber_rvec.length();
3197 /* Third pass checks for easy conflicts. */
3198 /* ??? Why are we doing this on trees instead of rtx. */
3200 bool clobber_conflict_found = 0;
3201 for (i = 0; i < noutputs; ++i)
3202 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3203 clobber_conflict_found = 1;
3204 for (i = 0; i < ninputs - ninout; ++i)
3205 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3206 clobber_conflict_found = 1;
3208 /* Make vectors for the expression-rtx, constraint strings,
3209 and named operands. */
3211 rtvec argvec = rtvec_alloc (ninputs);
3212 rtvec constraintvec = rtvec_alloc (ninputs);
3213 rtvec labelvec = rtvec_alloc (nlabels);
3215 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3216 : GET_MODE (output_rvec[0])),
3217 ggc_strdup (gimple_asm_string (stmt)),
3218 "", 0, argvec, constraintvec,
3219 labelvec, locus);
3220 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3222 for (i = 0; i < ninputs; ++i)
3224 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3225 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3226 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3227 constraints[i + noutputs],
3228 locus);
3231 /* Copy labels to the vector. */
3232 rtx_code_label *fallthru_label = NULL;
3233 if (nlabels > 0)
3235 basic_block fallthru_bb = NULL;
3236 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3237 if (fallthru)
3238 fallthru_bb = fallthru->dest;
3240 for (i = 0; i < nlabels; ++i)
3242 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3243 rtx_insn *r;
3244 /* If asm goto has any labels in the fallthru basic block, use
3245 a label that we emit immediately after the asm goto. Expansion
3246 may insert further instructions into the same basic block after
3247 asm goto and if we don't do this, insertion of instructions on
3248 the fallthru edge might misbehave. See PR58670. */
3249 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3251 if (fallthru_label == NULL_RTX)
3252 fallthru_label = gen_label_rtx ();
3253 r = fallthru_label;
3255 else
3256 r = label_rtx (label);
3257 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3261 /* Now, for each output, construct an rtx
3262 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3263 ARGVEC CONSTRAINTS OPNAMES))
3264 If there is more than one, put them inside a PARALLEL. */
3266 if (nlabels > 0 && nclobbers == 0)
3268 gcc_assert (noutputs == 0);
3269 emit_jump_insn (body);
3271 else if (noutputs == 0 && nclobbers == 0)
3273 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3274 emit_insn (body);
3276 else if (noutputs == 1 && nclobbers == 0)
3278 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3279 emit_insn (gen_rtx_SET (output_rvec[0], body));
3281 else
3283 rtx obody = body;
3284 int num = noutputs;
3286 if (num == 0)
3287 num = 1;
3289 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3291 /* For each output operand, store a SET. */
3292 for (i = 0; i < noutputs; ++i)
3294 rtx src, o = output_rvec[i];
3295 if (i == 0)
3297 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3298 src = obody;
3300 else
3302 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3303 ASM_OPERANDS_TEMPLATE (obody),
3304 constraints[i], i, argvec,
3305 constraintvec, labelvec, locus);
3306 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3308 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3311 /* If there are no outputs (but there are some clobbers)
3312 store the bare ASM_OPERANDS into the PARALLEL. */
3313 if (i == 0)
3314 XVECEXP (body, 0, i++) = obody;
3316 /* Store (clobber REG) for each clobbered register specified. */
3317 for (unsigned j = 0; j < nclobbers; ++j)
3319 rtx clobbered_reg = clobber_rvec[j];
3321 /* Do sanity check for overlap between clobbers and respectively
3322 input and outputs that hasn't been handled. Such overlap
3323 should have been detected and reported above. */
3324 if (!clobber_conflict_found && REG_P (clobbered_reg))
3326 /* We test the old body (obody) contents to avoid
3327 tripping over the under-construction body. */
3328 for (unsigned k = 0; k < noutputs; ++k)
3329 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3330 internal_error ("asm clobber conflict with output operand");
3332 for (unsigned k = 0; k < ninputs - ninout; ++k)
3333 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3334 internal_error ("asm clobber conflict with input operand");
3337 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3340 if (nlabels > 0)
3341 emit_jump_insn (body);
3342 else
3343 emit_insn (body);
3346 generating_concat_p = old_generating_concat_p;
3348 if (fallthru_label)
3349 emit_label (fallthru_label);
3351 if (after_md_seq)
3352 emit_insn (after_md_seq);
3353 if (after_rtl_seq)
3354 emit_insn (after_rtl_seq);
3356 free_temp_slots ();
3357 crtl->has_asm_statement = 1;
3360 /* Emit code to jump to the address
3361 specified by the pointer expression EXP. */
3363 static void
3364 expand_computed_goto (tree exp)
3366 rtx x = expand_normal (exp);
3368 do_pending_stack_adjust ();
3369 emit_indirect_jump (x);
3372 /* Generate RTL code for a `goto' statement with target label LABEL.
3373 LABEL should be a LABEL_DECL tree node that was or will later be
3374 defined with `expand_label'. */
3376 static void
3377 expand_goto (tree label)
3379 if (flag_checking)
3381 /* Check for a nonlocal goto to a containing function. Should have
3382 gotten translated to __builtin_nonlocal_goto. */
3383 tree context = decl_function_context (label);
3384 gcc_assert (!context || context == current_function_decl);
3387 emit_jump (jump_target_rtx (label));
3390 /* Output a return with no value. */
3392 static void
3393 expand_null_return_1 (void)
3395 clear_pending_stack_adjust ();
3396 do_pending_stack_adjust ();
3397 emit_jump (return_label);
3400 /* Generate RTL to return from the current function, with no value.
3401 (That is, we do not do anything about returning any value.) */
3403 void
3404 expand_null_return (void)
3406 /* If this function was declared to return a value, but we
3407 didn't, clobber the return registers so that they are not
3408 propagated live to the rest of the function. */
3409 clobber_return_register ();
3411 expand_null_return_1 ();
3414 /* Generate RTL to return from the current function, with value VAL. */
3416 static void
3417 expand_value_return (rtx val)
3419 /* Copy the value to the return location unless it's already there. */
3421 tree decl = DECL_RESULT (current_function_decl);
3422 rtx return_reg = DECL_RTL (decl);
3423 if (return_reg != val)
3425 tree funtype = TREE_TYPE (current_function_decl);
3426 tree type = TREE_TYPE (decl);
3427 int unsignedp = TYPE_UNSIGNED (type);
3428 machine_mode old_mode = DECL_MODE (decl);
3429 machine_mode mode;
3430 if (DECL_BY_REFERENCE (decl))
3431 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3432 else
3433 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3435 if (mode != old_mode)
3436 val = convert_modes (mode, old_mode, val, unsignedp);
3438 if (GET_CODE (return_reg) == PARALLEL)
3439 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3440 else
3441 emit_move_insn (return_reg, val);
3444 expand_null_return_1 ();
3447 /* Generate RTL to evaluate the expression RETVAL and return it
3448 from the current function. */
3450 static void
3451 expand_return (tree retval)
3453 rtx result_rtl;
3454 rtx val = 0;
3455 tree retval_rhs;
3457 /* If function wants no value, give it none. */
3458 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3460 expand_normal (retval);
3461 expand_null_return ();
3462 return;
3465 if (retval == error_mark_node)
3467 /* Treat this like a return of no value from a function that
3468 returns a value. */
3469 expand_null_return ();
3470 return;
3472 else if ((TREE_CODE (retval) == MODIFY_EXPR
3473 || TREE_CODE (retval) == INIT_EXPR)
3474 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3475 retval_rhs = TREE_OPERAND (retval, 1);
3476 else
3477 retval_rhs = retval;
3479 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3481 /* If we are returning the RESULT_DECL, then the value has already
3482 been stored into it, so we don't have to do anything special. */
3483 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3484 expand_value_return (result_rtl);
3486 /* If the result is an aggregate that is being returned in one (or more)
3487 registers, load the registers here. */
3489 else if (retval_rhs != 0
3490 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3491 && REG_P (result_rtl))
3493 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3494 if (val)
3496 /* Use the mode of the result value on the return register. */
3497 PUT_MODE (result_rtl, GET_MODE (val));
3498 expand_value_return (val);
3500 else
3501 expand_null_return ();
3503 else if (retval_rhs != 0
3504 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3505 && (REG_P (result_rtl)
3506 || (GET_CODE (result_rtl) == PARALLEL)))
3508 /* Compute the return value into a temporary (usually a pseudo reg). */
3510 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3511 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3512 val = force_not_mem (val);
3513 expand_value_return (val);
3515 else
3517 /* No hard reg used; calculate value into hard return reg. */
3518 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3519 expand_value_return (result_rtl);
3523 /* Expand a clobber of LHS. If LHS is stored it in a multi-part
3524 register, tell the rtl optimizers that its value is no longer
3525 needed. */
3527 static void
3528 expand_clobber (tree lhs)
3530 if (DECL_P (lhs))
3532 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3533 if (decl_rtl && REG_P (decl_rtl))
3535 machine_mode decl_mode = GET_MODE (decl_rtl);
3536 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3537 REGMODE_NATURAL_SIZE (decl_mode)))
3538 emit_clobber (decl_rtl);
3543 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3544 STMT that doesn't require special handling for outgoing edges. That
3545 is no tailcalls and no GIMPLE_COND. */
3547 static void
3548 expand_gimple_stmt_1 (gimple *stmt)
3550 tree op0;
3552 set_curr_insn_location (gimple_location (stmt));
3554 switch (gimple_code (stmt))
3556 case GIMPLE_GOTO:
3557 op0 = gimple_goto_dest (stmt);
3558 if (TREE_CODE (op0) == LABEL_DECL)
3559 expand_goto (op0);
3560 else
3561 expand_computed_goto (op0);
3562 break;
3563 case GIMPLE_LABEL:
3564 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3565 break;
3566 case GIMPLE_NOP:
3567 case GIMPLE_PREDICT:
3568 break;
3569 case GIMPLE_SWITCH:
3571 gswitch *swtch = as_a <gswitch *> (stmt);
3572 if (gimple_switch_num_labels (swtch) == 1)
3573 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3574 else
3575 expand_case (swtch);
3577 break;
3578 case GIMPLE_ASM:
3579 expand_asm_stmt (as_a <gasm *> (stmt));
3580 break;
3581 case GIMPLE_CALL:
3582 expand_call_stmt (as_a <gcall *> (stmt));
3583 break;
3585 case GIMPLE_RETURN:
3587 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3589 if (op0 && op0 != error_mark_node)
3591 tree result = DECL_RESULT (current_function_decl);
3593 /* If we are not returning the current function's RESULT_DECL,
3594 build an assignment to it. */
3595 if (op0 != result)
3597 /* I believe that a function's RESULT_DECL is unique. */
3598 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3600 /* ??? We'd like to use simply expand_assignment here,
3601 but this fails if the value is of BLKmode but the return
3602 decl is a register. expand_return has special handling
3603 for this combination, which eventually should move
3604 to common code. See comments there. Until then, let's
3605 build a modify expression :-/ */
3606 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3607 result, op0);
3611 if (!op0)
3612 expand_null_return ();
3613 else
3614 expand_return (op0);
3616 break;
3618 case GIMPLE_ASSIGN:
3620 gassign *assign_stmt = as_a <gassign *> (stmt);
3621 tree lhs = gimple_assign_lhs (assign_stmt);
3623 /* Tree expand used to fiddle with |= and &= of two bitfield
3624 COMPONENT_REFs here. This can't happen with gimple, the LHS
3625 of binary assigns must be a gimple reg. */
3627 if (TREE_CODE (lhs) != SSA_NAME
3628 || get_gimple_rhs_class (gimple_expr_code (stmt))
3629 == GIMPLE_SINGLE_RHS)
3631 tree rhs = gimple_assign_rhs1 (assign_stmt);
3632 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3633 == GIMPLE_SINGLE_RHS);
3634 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3635 /* Do not put locations on possibly shared trees. */
3636 && !is_gimple_min_invariant (rhs))
3637 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3638 if (TREE_CLOBBER_P (rhs))
3639 /* This is a clobber to mark the going out of scope for
3640 this LHS. */
3641 expand_clobber (lhs);
3642 else
3643 expand_assignment (lhs, rhs,
3644 gimple_assign_nontemporal_move_p (
3645 assign_stmt));
3647 else
3649 rtx target, temp;
3650 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3651 struct separate_ops ops;
3652 bool promoted = false;
3654 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3655 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3656 promoted = true;
3658 ops.code = gimple_assign_rhs_code (assign_stmt);
3659 ops.type = TREE_TYPE (lhs);
3660 switch (get_gimple_rhs_class (ops.code))
3662 case GIMPLE_TERNARY_RHS:
3663 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3664 /* Fallthru */
3665 case GIMPLE_BINARY_RHS:
3666 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3667 /* Fallthru */
3668 case GIMPLE_UNARY_RHS:
3669 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3670 break;
3671 default:
3672 gcc_unreachable ();
3674 ops.location = gimple_location (stmt);
3676 /* If we want to use a nontemporal store, force the value to
3677 register first. If we store into a promoted register,
3678 don't directly expand to target. */
3679 temp = nontemporal || promoted ? NULL_RTX : target;
3680 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3681 EXPAND_NORMAL);
3683 if (temp == target)
3685 else if (promoted)
3687 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3688 /* If TEMP is a VOIDmode constant, use convert_modes to make
3689 sure that we properly convert it. */
3690 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3692 temp = convert_modes (GET_MODE (target),
3693 TYPE_MODE (ops.type),
3694 temp, unsignedp);
3695 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3696 GET_MODE (target), temp, unsignedp);
3699 convert_move (SUBREG_REG (target), temp, unsignedp);
3701 else if (nontemporal && emit_storent_insn (target, temp))
3703 else
3705 temp = force_operand (temp, target);
3706 if (temp != target)
3707 emit_move_insn (target, temp);
3711 break;
3713 default:
3714 gcc_unreachable ();
3718 /* Expand one gimple statement STMT and return the last RTL instruction
3719 before any of the newly generated ones.
3721 In addition to generating the necessary RTL instructions this also
3722 sets REG_EH_REGION notes if necessary and sets the current source
3723 location for diagnostics. */
3725 static rtx_insn *
3726 expand_gimple_stmt (gimple *stmt)
3728 location_t saved_location = input_location;
3729 rtx_insn *last = get_last_insn ();
3730 int lp_nr;
3732 gcc_assert (cfun);
3734 /* We need to save and restore the current source location so that errors
3735 discovered during expansion are emitted with the right location. But
3736 it would be better if the diagnostic routines used the source location
3737 embedded in the tree nodes rather than globals. */
3738 if (gimple_has_location (stmt))
3739 input_location = gimple_location (stmt);
3741 expand_gimple_stmt_1 (stmt);
3743 /* Free any temporaries used to evaluate this statement. */
3744 free_temp_slots ();
3746 input_location = saved_location;
3748 /* Mark all insns that may trap. */
3749 lp_nr = lookup_stmt_eh_lp (stmt);
3750 if (lp_nr)
3752 rtx_insn *insn;
3753 for (insn = next_real_insn (last); insn;
3754 insn = next_real_insn (insn))
3756 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3757 /* If we want exceptions for non-call insns, any
3758 may_trap_p instruction may throw. */
3759 && GET_CODE (PATTERN (insn)) != CLOBBER
3760 && GET_CODE (PATTERN (insn)) != CLOBBER_HIGH
3761 && GET_CODE (PATTERN (insn)) != USE
3762 && insn_could_throw_p (insn))
3763 make_reg_eh_region_note (insn, 0, lp_nr);
3767 return last;
3770 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3771 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3772 generated a tail call (something that might be denied by the ABI
3773 rules governing the call; see calls.c).
3775 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3776 can still reach the rest of BB. The case here is __builtin_sqrt,
3777 where the NaN result goes through the external function (with a
3778 tailcall) and the normal result happens via a sqrt instruction. */
3780 static basic_block
3781 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3783 rtx_insn *last2, *last;
3784 edge e;
3785 edge_iterator ei;
3786 profile_probability probability;
3788 last2 = last = expand_gimple_stmt (stmt);
3790 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3791 if (CALL_P (last) && SIBLING_CALL_P (last))
3792 goto found;
3794 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3796 *can_fallthru = true;
3797 return NULL;
3799 found:
3800 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3801 Any instructions emitted here are about to be deleted. */
3802 do_pending_stack_adjust ();
3804 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3805 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3806 EH or abnormal edges, we shouldn't have created a tail call in
3807 the first place. So it seems to me we should just be removing
3808 all edges here, or redirecting the existing fallthru edge to
3809 the exit block. */
3811 probability = profile_probability::never ();
3813 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3815 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3817 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3818 e->dest->count -= e->count ();
3819 probability += e->probability;
3820 remove_edge (e);
3822 else
3823 ei_next (&ei);
3826 /* This is somewhat ugly: the call_expr expander often emits instructions
3827 after the sibcall (to perform the function return). These confuse the
3828 find_many_sub_basic_blocks code, so we need to get rid of these. */
3829 last = NEXT_INSN (last);
3830 gcc_assert (BARRIER_P (last));
3832 *can_fallthru = false;
3833 while (NEXT_INSN (last))
3835 /* For instance an sqrt builtin expander expands if with
3836 sibcall in the then and label for `else`. */
3837 if (LABEL_P (NEXT_INSN (last)))
3839 *can_fallthru = true;
3840 break;
3842 delete_insn (NEXT_INSN (last));
3845 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3846 | EDGE_SIBCALL);
3847 e->probability = probability;
3848 BB_END (bb) = last;
3849 update_bb_for_insn (bb);
3851 if (NEXT_INSN (last))
3853 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3855 last = BB_END (bb);
3856 if (BARRIER_P (last))
3857 BB_END (bb) = PREV_INSN (last);
3860 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3862 return bb;
3865 /* Return the difference between the floor and the truncated result of
3866 a signed division by OP1 with remainder MOD. */
3867 static rtx
3868 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3870 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3871 return gen_rtx_IF_THEN_ELSE
3872 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3873 gen_rtx_IF_THEN_ELSE
3874 (mode, gen_rtx_LT (BImode,
3875 gen_rtx_DIV (mode, op1, mod),
3876 const0_rtx),
3877 constm1_rtx, const0_rtx),
3878 const0_rtx);
3881 /* Return the difference between the ceil and the truncated result of
3882 a signed division by OP1 with remainder MOD. */
3883 static rtx
3884 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3886 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3887 return gen_rtx_IF_THEN_ELSE
3888 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3889 gen_rtx_IF_THEN_ELSE
3890 (mode, gen_rtx_GT (BImode,
3891 gen_rtx_DIV (mode, op1, mod),
3892 const0_rtx),
3893 const1_rtx, const0_rtx),
3894 const0_rtx);
3897 /* Return the difference between the ceil and the truncated result of
3898 an unsigned division by OP1 with remainder MOD. */
3899 static rtx
3900 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3902 /* (mod != 0 ? 1 : 0) */
3903 return gen_rtx_IF_THEN_ELSE
3904 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3905 const1_rtx, const0_rtx);
3908 /* Return the difference between the rounded and the truncated result
3909 of a signed division by OP1 with remainder MOD. Halfway cases are
3910 rounded away from zero, rather than to the nearest even number. */
3911 static rtx
3912 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3914 /* (abs (mod) >= abs (op1) - abs (mod)
3915 ? (op1 / mod > 0 ? 1 : -1)
3916 : 0) */
3917 return gen_rtx_IF_THEN_ELSE
3918 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3919 gen_rtx_MINUS (mode,
3920 gen_rtx_ABS (mode, op1),
3921 gen_rtx_ABS (mode, mod))),
3922 gen_rtx_IF_THEN_ELSE
3923 (mode, gen_rtx_GT (BImode,
3924 gen_rtx_DIV (mode, op1, mod),
3925 const0_rtx),
3926 const1_rtx, constm1_rtx),
3927 const0_rtx);
3930 /* Return the difference between the rounded and the truncated result
3931 of a unsigned division by OP1 with remainder MOD. Halfway cases
3932 are rounded away from zero, rather than to the nearest even
3933 number. */
3934 static rtx
3935 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
3937 /* (mod >= op1 - mod ? 1 : 0) */
3938 return gen_rtx_IF_THEN_ELSE
3939 (mode, gen_rtx_GE (BImode, mod,
3940 gen_rtx_MINUS (mode, op1, mod)),
3941 const1_rtx, const0_rtx);
3944 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3945 any rtl. */
3947 static rtx
3948 convert_debug_memory_address (scalar_int_mode mode, rtx x,
3949 addr_space_t as)
3951 #ifndef POINTERS_EXTEND_UNSIGNED
3952 gcc_assert (mode == Pmode
3953 || mode == targetm.addr_space.address_mode (as));
3954 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
3955 #else
3956 rtx temp;
3958 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
3960 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3961 return x;
3963 /* X must have some form of address mode already. */
3964 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
3965 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3966 x = lowpart_subreg (mode, x, xmode);
3967 else if (POINTERS_EXTEND_UNSIGNED > 0)
3968 x = gen_rtx_ZERO_EXTEND (mode, x);
3969 else if (!POINTERS_EXTEND_UNSIGNED)
3970 x = gen_rtx_SIGN_EXTEND (mode, x);
3971 else
3973 switch (GET_CODE (x))
3975 case SUBREG:
3976 if ((SUBREG_PROMOTED_VAR_P (x)
3977 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3978 || (GET_CODE (SUBREG_REG (x)) == PLUS
3979 && REG_P (XEXP (SUBREG_REG (x), 0))
3980 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
3981 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
3982 && GET_MODE (SUBREG_REG (x)) == mode)
3983 return SUBREG_REG (x);
3984 break;
3985 case LABEL_REF:
3986 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
3987 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
3988 return temp;
3989 case SYMBOL_REF:
3990 temp = shallow_copy_rtx (x);
3991 PUT_MODE (temp, mode);
3992 return temp;
3993 case CONST:
3994 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3995 if (temp)
3996 temp = gen_rtx_CONST (mode, temp);
3997 return temp;
3998 case PLUS:
3999 case MINUS:
4000 if (CONST_INT_P (XEXP (x, 1)))
4002 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4003 if (temp)
4004 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4006 break;
4007 default:
4008 break;
4010 /* Don't know how to express ptr_extend as operation in debug info. */
4011 return NULL;
4013 #endif /* POINTERS_EXTEND_UNSIGNED */
4015 return x;
4018 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4019 by avoid_deep_ter_for_debug. */
4021 static hash_map<tree, tree> *deep_ter_debug_map;
4023 /* Split too deep TER chains for debug stmts using debug temporaries. */
4025 static void
4026 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4028 use_operand_p use_p;
4029 ssa_op_iter iter;
4030 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4032 tree use = USE_FROM_PTR (use_p);
4033 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4034 continue;
4035 gimple *g = get_gimple_for_ssa_name (use);
4036 if (g == NULL)
4037 continue;
4038 if (depth > 6 && !stmt_ends_bb_p (g))
4040 if (deep_ter_debug_map == NULL)
4041 deep_ter_debug_map = new hash_map<tree, tree>;
4043 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4044 if (vexpr != NULL)
4045 continue;
4046 vexpr = make_node (DEBUG_EXPR_DECL);
4047 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4048 DECL_ARTIFICIAL (vexpr) = 1;
4049 TREE_TYPE (vexpr) = TREE_TYPE (use);
4050 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4051 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4052 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4053 avoid_deep_ter_for_debug (def_temp, 0);
4055 else
4056 avoid_deep_ter_for_debug (g, depth + 1);
4060 /* Return an RTX equivalent to the value of the parameter DECL. */
4062 static rtx
4063 expand_debug_parm_decl (tree decl)
4065 rtx incoming = DECL_INCOMING_RTL (decl);
4067 if (incoming
4068 && GET_MODE (incoming) != BLKmode
4069 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4070 || (MEM_P (incoming)
4071 && REG_P (XEXP (incoming, 0))
4072 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4074 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4076 #ifdef HAVE_window_save
4077 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4078 If the target machine has an explicit window save instruction, the
4079 actual entry value is the corresponding OUTGOING_REGNO instead. */
4080 if (REG_P (incoming)
4081 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4082 incoming
4083 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4084 OUTGOING_REGNO (REGNO (incoming)), 0);
4085 else if (MEM_P (incoming))
4087 rtx reg = XEXP (incoming, 0);
4088 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4090 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4091 incoming = replace_equiv_address_nv (incoming, reg);
4093 else
4094 incoming = copy_rtx (incoming);
4096 #endif
4098 ENTRY_VALUE_EXP (rtl) = incoming;
4099 return rtl;
4102 if (incoming
4103 && GET_MODE (incoming) != BLKmode
4104 && !TREE_ADDRESSABLE (decl)
4105 && MEM_P (incoming)
4106 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4107 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4108 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4109 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4110 return copy_rtx (incoming);
4112 return NULL_RTX;
4115 /* Return an RTX equivalent to the value of the tree expression EXP. */
4117 static rtx
4118 expand_debug_expr (tree exp)
4120 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4121 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4122 machine_mode inner_mode = VOIDmode;
4123 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4124 addr_space_t as;
4125 scalar_int_mode op0_mode, op1_mode, addr_mode;
4127 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4129 case tcc_expression:
4130 switch (TREE_CODE (exp))
4132 case COND_EXPR:
4133 case DOT_PROD_EXPR:
4134 case SAD_EXPR:
4135 case WIDEN_MULT_PLUS_EXPR:
4136 case WIDEN_MULT_MINUS_EXPR:
4137 goto ternary;
4139 case TRUTH_ANDIF_EXPR:
4140 case TRUTH_ORIF_EXPR:
4141 case TRUTH_AND_EXPR:
4142 case TRUTH_OR_EXPR:
4143 case TRUTH_XOR_EXPR:
4144 goto binary;
4146 case TRUTH_NOT_EXPR:
4147 goto unary;
4149 default:
4150 break;
4152 break;
4154 ternary:
4155 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4156 if (!op2)
4157 return NULL_RTX;
4158 /* Fall through. */
4160 binary:
4161 case tcc_binary:
4162 if (mode == BLKmode)
4163 return NULL_RTX;
4164 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4165 if (!op1)
4166 return NULL_RTX;
4167 switch (TREE_CODE (exp))
4169 case LSHIFT_EXPR:
4170 case RSHIFT_EXPR:
4171 case LROTATE_EXPR:
4172 case RROTATE_EXPR:
4173 case WIDEN_LSHIFT_EXPR:
4174 /* Ensure second operand isn't wider than the first one. */
4175 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4176 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4177 && (GET_MODE_UNIT_PRECISION (mode)
4178 < GET_MODE_PRECISION (op1_mode)))
4179 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4180 break;
4181 default:
4182 break;
4184 /* Fall through. */
4186 unary:
4187 case tcc_unary:
4188 if (mode == BLKmode)
4189 return NULL_RTX;
4190 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4191 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4192 if (!op0)
4193 return NULL_RTX;
4194 break;
4196 case tcc_comparison:
4197 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4198 goto binary;
4200 case tcc_type:
4201 case tcc_statement:
4202 gcc_unreachable ();
4204 case tcc_constant:
4205 case tcc_exceptional:
4206 case tcc_declaration:
4207 case tcc_reference:
4208 case tcc_vl_exp:
4209 break;
4212 switch (TREE_CODE (exp))
4214 case STRING_CST:
4215 if (!lookup_constant_def (exp))
4217 if (strlen (TREE_STRING_POINTER (exp)) + 1
4218 != (size_t) TREE_STRING_LENGTH (exp))
4219 return NULL_RTX;
4220 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4221 op0 = gen_rtx_MEM (BLKmode, op0);
4222 set_mem_attributes (op0, exp, 0);
4223 return op0;
4225 /* Fall through. */
4227 case INTEGER_CST:
4228 case REAL_CST:
4229 case FIXED_CST:
4230 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4231 return op0;
4233 case POLY_INT_CST:
4234 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4236 case COMPLEX_CST:
4237 gcc_assert (COMPLEX_MODE_P (mode));
4238 op0 = expand_debug_expr (TREE_REALPART (exp));
4239 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4240 return gen_rtx_CONCAT (mode, op0, op1);
4242 case DEBUG_EXPR_DECL:
4243 op0 = DECL_RTL_IF_SET (exp);
4245 if (op0)
4246 return op0;
4248 op0 = gen_rtx_DEBUG_EXPR (mode);
4249 DEBUG_EXPR_TREE_DECL (op0) = exp;
4250 SET_DECL_RTL (exp, op0);
4252 return op0;
4254 case VAR_DECL:
4255 case PARM_DECL:
4256 case FUNCTION_DECL:
4257 case LABEL_DECL:
4258 case CONST_DECL:
4259 case RESULT_DECL:
4260 op0 = DECL_RTL_IF_SET (exp);
4262 /* This decl was probably optimized away. */
4263 if (!op0)
4265 if (!VAR_P (exp)
4266 || DECL_EXTERNAL (exp)
4267 || !TREE_STATIC (exp)
4268 || !DECL_NAME (exp)
4269 || DECL_HARD_REGISTER (exp)
4270 || DECL_IN_CONSTANT_POOL (exp)
4271 || mode == VOIDmode)
4272 return NULL;
4274 op0 = make_decl_rtl_for_debug (exp);
4275 if (!MEM_P (op0)
4276 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4277 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4278 return NULL;
4280 else
4281 op0 = copy_rtx (op0);
4283 if (GET_MODE (op0) == BLKmode
4284 /* If op0 is not BLKmode, but mode is, adjust_mode
4285 below would ICE. While it is likely a FE bug,
4286 try to be robust here. See PR43166. */
4287 || mode == BLKmode
4288 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4290 gcc_assert (MEM_P (op0));
4291 op0 = adjust_address_nv (op0, mode, 0);
4292 return op0;
4295 /* Fall through. */
4297 adjust_mode:
4298 case PAREN_EXPR:
4299 CASE_CONVERT:
4301 inner_mode = GET_MODE (op0);
4303 if (mode == inner_mode)
4304 return op0;
4306 if (inner_mode == VOIDmode)
4308 if (TREE_CODE (exp) == SSA_NAME)
4309 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4310 else
4311 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4312 if (mode == inner_mode)
4313 return op0;
4316 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4318 if (GET_MODE_UNIT_BITSIZE (mode)
4319 == GET_MODE_UNIT_BITSIZE (inner_mode))
4320 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4321 else if (GET_MODE_UNIT_BITSIZE (mode)
4322 < GET_MODE_UNIT_BITSIZE (inner_mode))
4323 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4324 else
4325 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4327 else if (FLOAT_MODE_P (mode))
4329 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4330 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4331 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4332 else
4333 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4335 else if (FLOAT_MODE_P (inner_mode))
4337 if (unsignedp)
4338 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4339 else
4340 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4342 else if (GET_MODE_UNIT_PRECISION (mode)
4343 == GET_MODE_UNIT_PRECISION (inner_mode))
4344 op0 = lowpart_subreg (mode, op0, inner_mode);
4345 else if (GET_MODE_UNIT_PRECISION (mode)
4346 < GET_MODE_UNIT_PRECISION (inner_mode))
4347 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4348 else if (UNARY_CLASS_P (exp)
4349 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4350 : unsignedp)
4351 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4352 else
4353 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4355 return op0;
4358 case MEM_REF:
4359 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4361 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4362 TREE_OPERAND (exp, 0),
4363 TREE_OPERAND (exp, 1));
4364 if (newexp)
4365 return expand_debug_expr (newexp);
4367 /* FALLTHROUGH */
4368 case INDIRECT_REF:
4369 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4370 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4371 if (!op0)
4372 return NULL;
4374 if (TREE_CODE (exp) == MEM_REF)
4376 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4377 || (GET_CODE (op0) == PLUS
4378 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4379 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4380 Instead just use get_inner_reference. */
4381 goto component_ref;
4383 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4384 poly_int64 offset;
4385 if (!op1 || !poly_int_rtx_p (op1, &offset))
4386 return NULL;
4388 op0 = plus_constant (inner_mode, op0, offset);
4391 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4393 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4394 op0, as);
4395 if (op0 == NULL_RTX)
4396 return NULL;
4398 op0 = gen_rtx_MEM (mode, op0);
4399 set_mem_attributes (op0, exp, 0);
4400 if (TREE_CODE (exp) == MEM_REF
4401 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4402 set_mem_expr (op0, NULL_TREE);
4403 set_mem_addr_space (op0, as);
4405 return op0;
4407 case TARGET_MEM_REF:
4408 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4409 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4410 return NULL;
4412 op0 = expand_debug_expr
4413 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4414 if (!op0)
4415 return NULL;
4417 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4418 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4419 op0, as);
4420 if (op0 == NULL_RTX)
4421 return NULL;
4423 op0 = gen_rtx_MEM (mode, op0);
4425 set_mem_attributes (op0, exp, 0);
4426 set_mem_addr_space (op0, as);
4428 return op0;
4430 component_ref:
4431 case ARRAY_REF:
4432 case ARRAY_RANGE_REF:
4433 case COMPONENT_REF:
4434 case BIT_FIELD_REF:
4435 case REALPART_EXPR:
4436 case IMAGPART_EXPR:
4437 case VIEW_CONVERT_EXPR:
4439 machine_mode mode1;
4440 poly_int64 bitsize, bitpos;
4441 tree offset;
4442 int reversep, volatilep = 0;
4443 tree tem
4444 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4445 &unsignedp, &reversep, &volatilep);
4446 rtx orig_op0;
4448 if (known_eq (bitsize, 0))
4449 return NULL;
4451 orig_op0 = op0 = expand_debug_expr (tem);
4453 if (!op0)
4454 return NULL;
4456 if (offset)
4458 machine_mode addrmode, offmode;
4460 if (!MEM_P (op0))
4461 return NULL;
4463 op0 = XEXP (op0, 0);
4464 addrmode = GET_MODE (op0);
4465 if (addrmode == VOIDmode)
4466 addrmode = Pmode;
4468 op1 = expand_debug_expr (offset);
4469 if (!op1)
4470 return NULL;
4472 offmode = GET_MODE (op1);
4473 if (offmode == VOIDmode)
4474 offmode = TYPE_MODE (TREE_TYPE (offset));
4476 if (addrmode != offmode)
4477 op1 = lowpart_subreg (addrmode, op1, offmode);
4479 /* Don't use offset_address here, we don't need a
4480 recognizable address, and we don't want to generate
4481 code. */
4482 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4483 op0, op1));
4486 if (MEM_P (op0))
4488 if (mode1 == VOIDmode)
4490 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4491 return NULL;
4492 /* Bitfield. */
4493 mode1 = smallest_int_mode_for_size (bitsize);
4495 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4496 if (maybe_ne (bytepos, 0))
4498 op0 = adjust_address_nv (op0, mode1, bytepos);
4499 bitpos = num_trailing_bits (bitpos);
4501 else if (known_eq (bitpos, 0)
4502 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4503 op0 = adjust_address_nv (op0, mode, 0);
4504 else if (GET_MODE (op0) != mode1)
4505 op0 = adjust_address_nv (op0, mode1, 0);
4506 else
4507 op0 = copy_rtx (op0);
4508 if (op0 == orig_op0)
4509 op0 = shallow_copy_rtx (op0);
4510 set_mem_attributes (op0, exp, 0);
4513 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4514 return op0;
4516 if (maybe_lt (bitpos, 0))
4517 return NULL;
4519 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4520 return NULL;
4522 poly_int64 bytepos;
4523 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4524 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4526 machine_mode opmode = GET_MODE (op0);
4528 if (opmode == VOIDmode)
4529 opmode = TYPE_MODE (TREE_TYPE (tem));
4531 /* This condition may hold if we're expanding the address
4532 right past the end of an array that turned out not to
4533 be addressable (i.e., the address was only computed in
4534 debug stmts). The gen_subreg below would rightfully
4535 crash, and the address doesn't really exist, so just
4536 drop it. */
4537 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4538 return NULL;
4540 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4541 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4544 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4545 && TYPE_UNSIGNED (TREE_TYPE (exp))
4546 ? SIGN_EXTRACT
4547 : ZERO_EXTRACT, mode,
4548 GET_MODE (op0) != VOIDmode
4549 ? GET_MODE (op0)
4550 : TYPE_MODE (TREE_TYPE (tem)),
4551 op0, gen_int_mode (bitsize, word_mode),
4552 gen_int_mode (bitpos, word_mode));
4555 case ABS_EXPR:
4556 case ABSU_EXPR:
4557 return simplify_gen_unary (ABS, mode, op0, mode);
4559 case NEGATE_EXPR:
4560 return simplify_gen_unary (NEG, mode, op0, mode);
4562 case BIT_NOT_EXPR:
4563 return simplify_gen_unary (NOT, mode, op0, mode);
4565 case FLOAT_EXPR:
4566 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4567 0)))
4568 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4569 inner_mode);
4571 case FIX_TRUNC_EXPR:
4572 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4573 inner_mode);
4575 case POINTER_PLUS_EXPR:
4576 /* For the rare target where pointers are not the same size as
4577 size_t, we need to check for mis-matched modes and correct
4578 the addend. */
4579 if (op0 && op1
4580 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4581 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4582 && op0_mode != op1_mode)
4584 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4585 /* If OP0 is a partial mode, then we must truncate, even
4586 if it has the same bitsize as OP1 as GCC's
4587 representation of partial modes is opaque. */
4588 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4589 && (GET_MODE_BITSIZE (op0_mode)
4590 == GET_MODE_BITSIZE (op1_mode))))
4591 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4592 else
4593 /* We always sign-extend, regardless of the signedness of
4594 the operand, because the operand is always unsigned
4595 here even if the original C expression is signed. */
4596 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4598 /* Fall through. */
4599 case PLUS_EXPR:
4600 return simplify_gen_binary (PLUS, mode, op0, op1);
4602 case MINUS_EXPR:
4603 case POINTER_DIFF_EXPR:
4604 return simplify_gen_binary (MINUS, mode, op0, op1);
4606 case MULT_EXPR:
4607 return simplify_gen_binary (MULT, mode, op0, op1);
4609 case RDIV_EXPR:
4610 case TRUNC_DIV_EXPR:
4611 case EXACT_DIV_EXPR:
4612 if (unsignedp)
4613 return simplify_gen_binary (UDIV, mode, op0, op1);
4614 else
4615 return simplify_gen_binary (DIV, mode, op0, op1);
4617 case TRUNC_MOD_EXPR:
4618 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4620 case FLOOR_DIV_EXPR:
4621 if (unsignedp)
4622 return simplify_gen_binary (UDIV, mode, op0, op1);
4623 else
4625 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4626 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4627 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4628 return simplify_gen_binary (PLUS, mode, div, adj);
4631 case FLOOR_MOD_EXPR:
4632 if (unsignedp)
4633 return simplify_gen_binary (UMOD, mode, op0, op1);
4634 else
4636 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4637 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4638 adj = simplify_gen_unary (NEG, mode,
4639 simplify_gen_binary (MULT, mode, adj, op1),
4640 mode);
4641 return simplify_gen_binary (PLUS, mode, mod, adj);
4644 case CEIL_DIV_EXPR:
4645 if (unsignedp)
4647 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4648 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4649 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4650 return simplify_gen_binary (PLUS, mode, div, adj);
4652 else
4654 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4655 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4656 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4657 return simplify_gen_binary (PLUS, mode, div, adj);
4660 case CEIL_MOD_EXPR:
4661 if (unsignedp)
4663 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4664 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4665 adj = simplify_gen_unary (NEG, mode,
4666 simplify_gen_binary (MULT, mode, adj, op1),
4667 mode);
4668 return simplify_gen_binary (PLUS, mode, mod, adj);
4670 else
4672 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4673 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4674 adj = simplify_gen_unary (NEG, mode,
4675 simplify_gen_binary (MULT, mode, adj, op1),
4676 mode);
4677 return simplify_gen_binary (PLUS, mode, mod, adj);
4680 case ROUND_DIV_EXPR:
4681 if (unsignedp)
4683 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4684 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4685 rtx adj = round_udiv_adjust (mode, mod, op1);
4686 return simplify_gen_binary (PLUS, mode, div, adj);
4688 else
4690 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4691 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4692 rtx adj = round_sdiv_adjust (mode, mod, op1);
4693 return simplify_gen_binary (PLUS, mode, div, adj);
4696 case ROUND_MOD_EXPR:
4697 if (unsignedp)
4699 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4700 rtx adj = round_udiv_adjust (mode, mod, op1);
4701 adj = simplify_gen_unary (NEG, mode,
4702 simplify_gen_binary (MULT, mode, adj, op1),
4703 mode);
4704 return simplify_gen_binary (PLUS, mode, mod, adj);
4706 else
4708 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4709 rtx adj = round_sdiv_adjust (mode, mod, op1);
4710 adj = simplify_gen_unary (NEG, mode,
4711 simplify_gen_binary (MULT, mode, adj, op1),
4712 mode);
4713 return simplify_gen_binary (PLUS, mode, mod, adj);
4716 case LSHIFT_EXPR:
4717 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4719 case RSHIFT_EXPR:
4720 if (unsignedp)
4721 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4722 else
4723 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4725 case LROTATE_EXPR:
4726 return simplify_gen_binary (ROTATE, mode, op0, op1);
4728 case RROTATE_EXPR:
4729 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4731 case MIN_EXPR:
4732 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4734 case MAX_EXPR:
4735 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4737 case BIT_AND_EXPR:
4738 case TRUTH_AND_EXPR:
4739 return simplify_gen_binary (AND, mode, op0, op1);
4741 case BIT_IOR_EXPR:
4742 case TRUTH_OR_EXPR:
4743 return simplify_gen_binary (IOR, mode, op0, op1);
4745 case BIT_XOR_EXPR:
4746 case TRUTH_XOR_EXPR:
4747 return simplify_gen_binary (XOR, mode, op0, op1);
4749 case TRUTH_ANDIF_EXPR:
4750 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4752 case TRUTH_ORIF_EXPR:
4753 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4755 case TRUTH_NOT_EXPR:
4756 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4758 case LT_EXPR:
4759 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4760 op0, op1);
4762 case LE_EXPR:
4763 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4764 op0, op1);
4766 case GT_EXPR:
4767 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4768 op0, op1);
4770 case GE_EXPR:
4771 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4772 op0, op1);
4774 case EQ_EXPR:
4775 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4777 case NE_EXPR:
4778 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4780 case UNORDERED_EXPR:
4781 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4783 case ORDERED_EXPR:
4784 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4786 case UNLT_EXPR:
4787 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4789 case UNLE_EXPR:
4790 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4792 case UNGT_EXPR:
4793 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4795 case UNGE_EXPR:
4796 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4798 case UNEQ_EXPR:
4799 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4801 case LTGT_EXPR:
4802 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4804 case COND_EXPR:
4805 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4807 case COMPLEX_EXPR:
4808 gcc_assert (COMPLEX_MODE_P (mode));
4809 if (GET_MODE (op0) == VOIDmode)
4810 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4811 if (GET_MODE (op1) == VOIDmode)
4812 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4813 return gen_rtx_CONCAT (mode, op0, op1);
4815 case CONJ_EXPR:
4816 if (GET_CODE (op0) == CONCAT)
4817 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4818 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4819 XEXP (op0, 1),
4820 GET_MODE_INNER (mode)));
4821 else
4823 scalar_mode imode = GET_MODE_INNER (mode);
4824 rtx re, im;
4826 if (MEM_P (op0))
4828 re = adjust_address_nv (op0, imode, 0);
4829 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4831 else
4833 scalar_int_mode ifmode;
4834 scalar_int_mode ihmode;
4835 rtx halfsize;
4836 if (!int_mode_for_mode (mode).exists (&ifmode)
4837 || !int_mode_for_mode (imode).exists (&ihmode))
4838 return NULL;
4839 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4840 re = op0;
4841 if (mode != ifmode)
4842 re = gen_rtx_SUBREG (ifmode, re, 0);
4843 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4844 if (imode != ihmode)
4845 re = gen_rtx_SUBREG (imode, re, 0);
4846 im = copy_rtx (op0);
4847 if (mode != ifmode)
4848 im = gen_rtx_SUBREG (ifmode, im, 0);
4849 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4850 if (imode != ihmode)
4851 im = gen_rtx_SUBREG (imode, im, 0);
4853 im = gen_rtx_NEG (imode, im);
4854 return gen_rtx_CONCAT (mode, re, im);
4857 case ADDR_EXPR:
4858 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4859 if (!op0 || !MEM_P (op0))
4861 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4862 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4863 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4864 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4865 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4866 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4868 if (handled_component_p (TREE_OPERAND (exp, 0)))
4870 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
4871 bool reverse;
4872 tree decl
4873 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
4874 &bitsize, &maxsize, &reverse);
4875 if ((VAR_P (decl)
4876 || TREE_CODE (decl) == PARM_DECL
4877 || TREE_CODE (decl) == RESULT_DECL)
4878 && (!TREE_ADDRESSABLE (decl)
4879 || target_for_debug_bind (decl))
4880 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
4881 && known_gt (bitsize, 0)
4882 && known_eq (bitsize, maxsize))
4884 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4885 return plus_constant (mode, base, byteoffset);
4889 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4890 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4891 == ADDR_EXPR)
4893 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4894 0));
4895 if (op0 != NULL
4896 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4897 || (GET_CODE (op0) == PLUS
4898 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4899 && CONST_INT_P (XEXP (op0, 1)))))
4901 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4902 1));
4903 poly_int64 offset;
4904 if (!op1 || !poly_int_rtx_p (op1, &offset))
4905 return NULL;
4907 return plus_constant (mode, op0, offset);
4911 return NULL;
4914 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4915 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
4916 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
4918 return op0;
4920 case VECTOR_CST:
4922 unsigned HOST_WIDE_INT i, nelts;
4924 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
4925 return NULL;
4927 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
4929 for (i = 0; i < nelts; ++i)
4931 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4932 if (!op1)
4933 return NULL;
4934 XVECEXP (op0, 0, i) = op1;
4937 return op0;
4940 case CONSTRUCTOR:
4941 if (TREE_CLOBBER_P (exp))
4942 return NULL;
4943 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4945 unsigned i;
4946 unsigned HOST_WIDE_INT nelts;
4947 tree val;
4949 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
4950 goto flag_unsupported;
4952 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
4954 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4956 op1 = expand_debug_expr (val);
4957 if (!op1)
4958 return NULL;
4959 XVECEXP (op0, 0, i) = op1;
4962 if (i < nelts)
4964 op1 = expand_debug_expr
4965 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4967 if (!op1)
4968 return NULL;
4970 for (; i < nelts; i++)
4971 XVECEXP (op0, 0, i) = op1;
4974 return op0;
4976 else
4977 goto flag_unsupported;
4979 case CALL_EXPR:
4980 /* ??? Maybe handle some builtins? */
4981 return NULL;
4983 case SSA_NAME:
4985 gimple *g = get_gimple_for_ssa_name (exp);
4986 if (g)
4988 tree t = NULL_TREE;
4989 if (deep_ter_debug_map)
4991 tree *slot = deep_ter_debug_map->get (exp);
4992 if (slot)
4993 t = *slot;
4995 if (t == NULL_TREE)
4996 t = gimple_assign_rhs_to_tree (g);
4997 op0 = expand_debug_expr (t);
4998 if (!op0)
4999 return NULL;
5001 else
5003 /* If this is a reference to an incoming value of
5004 parameter that is never used in the code or where the
5005 incoming value is never used in the code, use
5006 PARM_DECL's DECL_RTL if set. */
5007 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5008 && SSA_NAME_VAR (exp)
5009 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5010 && has_zero_uses (exp))
5012 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5013 if (op0)
5014 goto adjust_mode;
5015 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5016 if (op0)
5017 goto adjust_mode;
5020 int part = var_to_partition (SA.map, exp);
5022 if (part == NO_PARTITION)
5023 return NULL;
5025 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5027 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5029 goto adjust_mode;
5032 case ERROR_MARK:
5033 return NULL;
5035 /* Vector stuff. For most of the codes we don't have rtl codes. */
5036 case REALIGN_LOAD_EXPR:
5037 case VEC_COND_EXPR:
5038 case VEC_PACK_FIX_TRUNC_EXPR:
5039 case VEC_PACK_FLOAT_EXPR:
5040 case VEC_PACK_SAT_EXPR:
5041 case VEC_PACK_TRUNC_EXPR:
5042 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5043 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5044 case VEC_UNPACK_FLOAT_HI_EXPR:
5045 case VEC_UNPACK_FLOAT_LO_EXPR:
5046 case VEC_UNPACK_HI_EXPR:
5047 case VEC_UNPACK_LO_EXPR:
5048 case VEC_WIDEN_MULT_HI_EXPR:
5049 case VEC_WIDEN_MULT_LO_EXPR:
5050 case VEC_WIDEN_MULT_EVEN_EXPR:
5051 case VEC_WIDEN_MULT_ODD_EXPR:
5052 case VEC_WIDEN_LSHIFT_HI_EXPR:
5053 case VEC_WIDEN_LSHIFT_LO_EXPR:
5054 case VEC_PERM_EXPR:
5055 case VEC_DUPLICATE_EXPR:
5056 case VEC_SERIES_EXPR:
5057 return NULL;
5059 /* Misc codes. */
5060 case ADDR_SPACE_CONVERT_EXPR:
5061 case FIXED_CONVERT_EXPR:
5062 case OBJ_TYPE_REF:
5063 case WITH_SIZE_EXPR:
5064 case BIT_INSERT_EXPR:
5065 return NULL;
5067 case DOT_PROD_EXPR:
5068 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5069 && SCALAR_INT_MODE_P (mode))
5072 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5073 0)))
5074 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5075 inner_mode);
5077 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5078 1)))
5079 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5080 inner_mode);
5081 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5082 return simplify_gen_binary (PLUS, mode, op0, op2);
5084 return NULL;
5086 case WIDEN_MULT_EXPR:
5087 case WIDEN_MULT_PLUS_EXPR:
5088 case WIDEN_MULT_MINUS_EXPR:
5089 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5090 && SCALAR_INT_MODE_P (mode))
5092 inner_mode = GET_MODE (op0);
5093 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5094 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5095 else
5096 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5097 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5098 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5099 else
5100 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5101 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5102 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5103 return op0;
5104 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5105 return simplify_gen_binary (PLUS, mode, op0, op2);
5106 else
5107 return simplify_gen_binary (MINUS, mode, op2, op0);
5109 return NULL;
5111 case MULT_HIGHPART_EXPR:
5112 /* ??? Similar to the above. */
5113 return NULL;
5115 case WIDEN_SUM_EXPR:
5116 case WIDEN_LSHIFT_EXPR:
5117 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5118 && SCALAR_INT_MODE_P (mode))
5121 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5122 0)))
5123 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5124 inner_mode);
5125 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5126 ? ASHIFT : PLUS, mode, op0, op1);
5128 return NULL;
5130 default:
5131 flag_unsupported:
5132 if (flag_checking)
5134 debug_tree (exp);
5135 gcc_unreachable ();
5137 return NULL;
5141 /* Return an RTX equivalent to the source bind value of the tree expression
5142 EXP. */
5144 static rtx
5145 expand_debug_source_expr (tree exp)
5147 rtx op0 = NULL_RTX;
5148 machine_mode mode = VOIDmode, inner_mode;
5150 switch (TREE_CODE (exp))
5152 case VAR_DECL:
5153 if (DECL_ABSTRACT_ORIGIN (exp))
5154 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5155 break;
5156 case PARM_DECL:
5158 mode = DECL_MODE (exp);
5159 op0 = expand_debug_parm_decl (exp);
5160 if (op0)
5161 break;
5162 /* See if this isn't an argument that has been completely
5163 optimized out. */
5164 if (!DECL_RTL_SET_P (exp)
5165 && !DECL_INCOMING_RTL (exp)
5166 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5168 tree aexp = DECL_ORIGIN (exp);
5169 if (DECL_CONTEXT (aexp)
5170 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5172 vec<tree, va_gc> **debug_args;
5173 unsigned int ix;
5174 tree ddecl;
5175 debug_args = decl_debug_args_lookup (current_function_decl);
5176 if (debug_args != NULL)
5178 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5179 ix += 2)
5180 if (ddecl == aexp)
5181 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5185 break;
5187 default:
5188 break;
5191 if (op0 == NULL_RTX)
5192 return NULL_RTX;
5194 inner_mode = GET_MODE (op0);
5195 if (mode == inner_mode)
5196 return op0;
5198 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5200 if (GET_MODE_UNIT_BITSIZE (mode)
5201 == GET_MODE_UNIT_BITSIZE (inner_mode))
5202 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5203 else if (GET_MODE_UNIT_BITSIZE (mode)
5204 < GET_MODE_UNIT_BITSIZE (inner_mode))
5205 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5206 else
5207 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5209 else if (FLOAT_MODE_P (mode))
5210 gcc_unreachable ();
5211 else if (FLOAT_MODE_P (inner_mode))
5213 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5214 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5215 else
5216 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5218 else if (GET_MODE_UNIT_PRECISION (mode)
5219 == GET_MODE_UNIT_PRECISION (inner_mode))
5220 op0 = lowpart_subreg (mode, op0, inner_mode);
5221 else if (GET_MODE_UNIT_PRECISION (mode)
5222 < GET_MODE_UNIT_PRECISION (inner_mode))
5223 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5224 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5225 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5226 else
5227 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5229 return op0;
5232 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5233 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5234 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5236 static void
5237 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5239 rtx exp = *exp_p;
5241 if (exp == NULL_RTX)
5242 return;
5244 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5245 return;
5247 if (depth == 4)
5249 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5250 rtx dval = make_debug_expr_from_rtl (exp);
5252 /* Emit a debug bind insn before INSN. */
5253 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5254 DEBUG_EXPR_TREE_DECL (dval), exp,
5255 VAR_INIT_STATUS_INITIALIZED);
5257 emit_debug_insn_before (bind, insn);
5258 *exp_p = dval;
5259 return;
5262 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5263 int i, j;
5264 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5265 switch (*format_ptr++)
5267 case 'e':
5268 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5269 break;
5271 case 'E':
5272 case 'V':
5273 for (j = 0; j < XVECLEN (exp, i); j++)
5274 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5275 break;
5277 default:
5278 break;
5282 /* Expand the _LOCs in debug insns. We run this after expanding all
5283 regular insns, so that any variables referenced in the function
5284 will have their DECL_RTLs set. */
5286 static void
5287 expand_debug_locations (void)
5289 rtx_insn *insn;
5290 rtx_insn *last = get_last_insn ();
5291 int save_strict_alias = flag_strict_aliasing;
5293 /* New alias sets while setting up memory attributes cause
5294 -fcompare-debug failures, even though it doesn't bring about any
5295 codegen changes. */
5296 flag_strict_aliasing = 0;
5298 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5299 if (DEBUG_BIND_INSN_P (insn))
5301 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5302 rtx val;
5303 rtx_insn *prev_insn, *insn2;
5304 machine_mode mode;
5306 if (value == NULL_TREE)
5307 val = NULL_RTX;
5308 else
5310 if (INSN_VAR_LOCATION_STATUS (insn)
5311 == VAR_INIT_STATUS_UNINITIALIZED)
5312 val = expand_debug_source_expr (value);
5313 /* The avoid_deep_ter_for_debug function inserts
5314 debug bind stmts after SSA_NAME definition, with the
5315 SSA_NAME as the whole bind location. Disable temporarily
5316 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5317 being defined in this DEBUG_INSN. */
5318 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5320 tree *slot = deep_ter_debug_map->get (value);
5321 if (slot)
5323 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5324 *slot = NULL_TREE;
5325 else
5326 slot = NULL;
5328 val = expand_debug_expr (value);
5329 if (slot)
5330 *slot = INSN_VAR_LOCATION_DECL (insn);
5332 else
5333 val = expand_debug_expr (value);
5334 gcc_assert (last == get_last_insn ());
5337 if (!val)
5338 val = gen_rtx_UNKNOWN_VAR_LOC ();
5339 else
5341 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5343 gcc_assert (mode == GET_MODE (val)
5344 || (GET_MODE (val) == VOIDmode
5345 && (CONST_SCALAR_INT_P (val)
5346 || GET_CODE (val) == CONST_FIXED
5347 || GET_CODE (val) == LABEL_REF)));
5350 INSN_VAR_LOCATION_LOC (insn) = val;
5351 prev_insn = PREV_INSN (insn);
5352 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5353 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5356 flag_strict_aliasing = save_strict_alias;
5359 /* Performs swapping operands of commutative operations to expand
5360 the expensive one first. */
5362 static void
5363 reorder_operands (basic_block bb)
5365 unsigned int *lattice; /* Hold cost of each statement. */
5366 unsigned int i = 0, n = 0;
5367 gimple_stmt_iterator gsi;
5368 gimple_seq stmts;
5369 gimple *stmt;
5370 bool swap;
5371 tree op0, op1;
5372 ssa_op_iter iter;
5373 use_operand_p use_p;
5374 gimple *def0, *def1;
5376 /* Compute cost of each statement using estimate_num_insns. */
5377 stmts = bb_seq (bb);
5378 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5380 stmt = gsi_stmt (gsi);
5381 if (!is_gimple_debug (stmt))
5382 gimple_set_uid (stmt, n++);
5384 lattice = XNEWVEC (unsigned int, n);
5385 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5387 unsigned cost;
5388 stmt = gsi_stmt (gsi);
5389 if (is_gimple_debug (stmt))
5390 continue;
5391 cost = estimate_num_insns (stmt, &eni_size_weights);
5392 lattice[i] = cost;
5393 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5395 tree use = USE_FROM_PTR (use_p);
5396 gimple *def_stmt;
5397 if (TREE_CODE (use) != SSA_NAME)
5398 continue;
5399 def_stmt = get_gimple_for_ssa_name (use);
5400 if (!def_stmt)
5401 continue;
5402 lattice[i] += lattice[gimple_uid (def_stmt)];
5404 i++;
5405 if (!is_gimple_assign (stmt)
5406 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5407 continue;
5408 op0 = gimple_op (stmt, 1);
5409 op1 = gimple_op (stmt, 2);
5410 if (TREE_CODE (op0) != SSA_NAME
5411 || TREE_CODE (op1) != SSA_NAME)
5412 continue;
5413 /* Swap operands if the second one is more expensive. */
5414 def0 = get_gimple_for_ssa_name (op0);
5415 def1 = get_gimple_for_ssa_name (op1);
5416 if (!def1)
5417 continue;
5418 swap = false;
5419 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5420 swap = true;
5421 if (swap)
5423 if (dump_file && (dump_flags & TDF_DETAILS))
5425 fprintf (dump_file, "Swap operands in stmt:\n");
5426 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5427 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5428 def0 ? lattice[gimple_uid (def0)] : 0,
5429 lattice[gimple_uid (def1)]);
5431 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5432 gimple_assign_rhs2_ptr (stmt));
5435 XDELETE (lattice);
5438 /* Expand basic block BB from GIMPLE trees to RTL. */
5440 static basic_block
5441 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5443 gimple_stmt_iterator gsi;
5444 gimple_seq stmts;
5445 gimple *stmt = NULL;
5446 rtx_note *note = NULL;
5447 rtx_insn *last;
5448 edge e;
5449 edge_iterator ei;
5451 if (dump_file)
5452 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5453 bb->index);
5455 /* Note that since we are now transitioning from GIMPLE to RTL, we
5456 cannot use the gsi_*_bb() routines because they expect the basic
5457 block to be in GIMPLE, instead of RTL. Therefore, we need to
5458 access the BB sequence directly. */
5459 if (optimize)
5460 reorder_operands (bb);
5461 stmts = bb_seq (bb);
5462 bb->il.gimple.seq = NULL;
5463 bb->il.gimple.phi_nodes = NULL;
5464 rtl_profile_for_bb (bb);
5465 init_rtl_bb_info (bb);
5466 bb->flags |= BB_RTL;
5468 /* Remove the RETURN_EXPR if we may fall though to the exit
5469 instead. */
5470 gsi = gsi_last (stmts);
5471 if (!gsi_end_p (gsi)
5472 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5474 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5476 gcc_assert (single_succ_p (bb));
5477 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5479 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5480 && !gimple_return_retval (ret_stmt))
5482 gsi_remove (&gsi, false);
5483 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5487 gsi = gsi_start (stmts);
5488 if (!gsi_end_p (gsi))
5490 stmt = gsi_stmt (gsi);
5491 if (gimple_code (stmt) != GIMPLE_LABEL)
5492 stmt = NULL;
5495 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5497 if (stmt || elt)
5499 gcc_checking_assert (!note);
5500 last = get_last_insn ();
5502 if (stmt)
5504 expand_gimple_stmt (stmt);
5505 gsi_next (&gsi);
5508 if (elt)
5509 emit_label (*elt);
5511 BB_HEAD (bb) = NEXT_INSN (last);
5512 if (NOTE_P (BB_HEAD (bb)))
5513 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5514 gcc_assert (LABEL_P (BB_HEAD (bb)));
5515 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5517 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5519 else
5520 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5522 if (note)
5523 NOTE_BASIC_BLOCK (note) = bb;
5525 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5527 basic_block new_bb;
5529 stmt = gsi_stmt (gsi);
5531 /* If this statement is a non-debug one, and we generate debug
5532 insns, then this one might be the last real use of a TERed
5533 SSA_NAME, but where there are still some debug uses further
5534 down. Expanding the current SSA name in such further debug
5535 uses by their RHS might lead to wrong debug info, as coalescing
5536 might make the operands of such RHS be placed into the same
5537 pseudo as something else. Like so:
5538 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5539 use(a_1);
5540 a_2 = ...
5541 #DEBUG ... => a_1
5542 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5543 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
5544 the write to a_2 would actually have clobbered the place which
5545 formerly held a_0.
5547 So, instead of that, we recognize the situation, and generate
5548 debug temporaries at the last real use of TERed SSA names:
5549 a_1 = a_0 + 1;
5550 #DEBUG #D1 => a_1
5551 use(a_1);
5552 a_2 = ...
5553 #DEBUG ... => #D1
5555 if (MAY_HAVE_DEBUG_BIND_INSNS
5556 && SA.values
5557 && !is_gimple_debug (stmt))
5559 ssa_op_iter iter;
5560 tree op;
5561 gimple *def;
5563 location_t sloc = curr_insn_location ();
5565 /* Look for SSA names that have their last use here (TERed
5566 names always have only one real use). */
5567 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5568 if ((def = get_gimple_for_ssa_name (op)))
5570 imm_use_iterator imm_iter;
5571 use_operand_p use_p;
5572 bool have_debug_uses = false;
5574 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5576 if (gimple_debug_bind_p (USE_STMT (use_p)))
5578 have_debug_uses = true;
5579 break;
5583 if (have_debug_uses)
5585 /* OP is a TERed SSA name, with DEF its defining
5586 statement, and where OP is used in further debug
5587 instructions. Generate a debug temporary, and
5588 replace all uses of OP in debug insns with that
5589 temporary. */
5590 gimple *debugstmt;
5591 tree value = gimple_assign_rhs_to_tree (def);
5592 tree vexpr = make_node (DEBUG_EXPR_DECL);
5593 rtx val;
5594 machine_mode mode;
5596 set_curr_insn_location (gimple_location (def));
5598 DECL_ARTIFICIAL (vexpr) = 1;
5599 TREE_TYPE (vexpr) = TREE_TYPE (value);
5600 if (DECL_P (value))
5601 mode = DECL_MODE (value);
5602 else
5603 mode = TYPE_MODE (TREE_TYPE (value));
5604 SET_DECL_MODE (vexpr, mode);
5606 val = gen_rtx_VAR_LOCATION
5607 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5609 emit_debug_insn (val);
5611 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5613 if (!gimple_debug_bind_p (debugstmt))
5614 continue;
5616 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5617 SET_USE (use_p, vexpr);
5619 update_stmt (debugstmt);
5623 set_curr_insn_location (sloc);
5626 currently_expanding_gimple_stmt = stmt;
5628 /* Expand this statement, then evaluate the resulting RTL and
5629 fixup the CFG accordingly. */
5630 if (gimple_code (stmt) == GIMPLE_COND)
5632 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5633 if (new_bb)
5634 return new_bb;
5636 else if (is_gimple_debug (stmt))
5638 location_t sloc = curr_insn_location ();
5639 gimple_stmt_iterator nsi = gsi;
5641 for (;;)
5643 tree var;
5644 tree value = NULL_TREE;
5645 rtx val = NULL_RTX;
5646 machine_mode mode;
5648 if (!gimple_debug_nonbind_marker_p (stmt))
5650 if (gimple_debug_bind_p (stmt))
5652 var = gimple_debug_bind_get_var (stmt);
5654 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5655 && TREE_CODE (var) != LABEL_DECL
5656 && !target_for_debug_bind (var))
5657 goto delink_debug_stmt;
5659 if (DECL_P (var))
5660 mode = DECL_MODE (var);
5661 else
5662 mode = TYPE_MODE (TREE_TYPE (var));
5664 if (gimple_debug_bind_has_value_p (stmt))
5665 value = gimple_debug_bind_get_value (stmt);
5667 val = gen_rtx_VAR_LOCATION
5668 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5670 else if (gimple_debug_source_bind_p (stmt))
5672 var = gimple_debug_source_bind_get_var (stmt);
5674 value = gimple_debug_source_bind_get_value (stmt);
5676 mode = DECL_MODE (var);
5678 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5679 VAR_INIT_STATUS_UNINITIALIZED);
5681 else
5682 gcc_unreachable ();
5684 /* If this function was first compiled with markers
5685 enabled, but they're now disable (e.g. LTO), drop
5686 them on the floor. */
5687 else if (gimple_debug_nonbind_marker_p (stmt)
5688 && !MAY_HAVE_DEBUG_MARKER_INSNS)
5689 goto delink_debug_stmt;
5690 else if (gimple_debug_begin_stmt_p (stmt))
5691 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
5692 else if (gimple_debug_inline_entry_p (stmt))
5694 tree block = gimple_block (stmt);
5696 if (block)
5697 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
5698 else
5699 goto delink_debug_stmt;
5701 else
5702 gcc_unreachable ();
5704 last = get_last_insn ();
5706 set_curr_insn_location (gimple_location (stmt));
5708 emit_debug_insn (val);
5710 if (dump_file && (dump_flags & TDF_DETAILS))
5712 /* We can't dump the insn with a TREE where an RTX
5713 is expected. */
5714 if (GET_CODE (val) == VAR_LOCATION)
5716 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
5717 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5719 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5720 if (GET_CODE (val) == VAR_LOCATION)
5721 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5724 delink_debug_stmt:
5725 /* In order not to generate too many debug temporaries,
5726 we delink all uses of debug statements we already expanded.
5727 Therefore debug statements between definition and real
5728 use of TERed SSA names will continue to use the SSA name,
5729 and not be replaced with debug temps. */
5730 delink_stmt_imm_use (stmt);
5732 gsi = nsi;
5733 gsi_next (&nsi);
5734 if (gsi_end_p (nsi))
5735 break;
5736 stmt = gsi_stmt (nsi);
5737 if (!is_gimple_debug (stmt))
5738 break;
5741 set_curr_insn_location (sloc);
5743 else
5745 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5746 if (call_stmt
5747 && gimple_call_tail_p (call_stmt)
5748 && disable_tail_calls)
5749 gimple_call_set_tail (call_stmt, false);
5751 if (call_stmt && gimple_call_tail_p (call_stmt))
5753 bool can_fallthru;
5754 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5755 if (new_bb)
5757 if (can_fallthru)
5758 bb = new_bb;
5759 else
5760 return new_bb;
5763 else
5765 def_operand_p def_p;
5766 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5768 if (def_p != NULL)
5770 /* Ignore this stmt if it is in the list of
5771 replaceable expressions. */
5772 if (SA.values
5773 && bitmap_bit_p (SA.values,
5774 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5775 continue;
5777 last = expand_gimple_stmt (stmt);
5778 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5783 currently_expanding_gimple_stmt = NULL;
5785 /* Expand implicit goto and convert goto_locus. */
5786 FOR_EACH_EDGE (e, ei, bb->succs)
5788 if (e->goto_locus != UNKNOWN_LOCATION)
5789 set_curr_insn_location (e->goto_locus);
5790 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5792 emit_jump (label_rtx_for_bb (e->dest));
5793 e->flags &= ~EDGE_FALLTHRU;
5797 /* Expanded RTL can create a jump in the last instruction of block.
5798 This later might be assumed to be a jump to successor and break edge insertion.
5799 We need to insert dummy move to prevent this. PR41440. */
5800 if (single_succ_p (bb)
5801 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5802 && (last = get_last_insn ())
5803 && (JUMP_P (last)
5804 || (DEBUG_INSN_P (last)
5805 && JUMP_P (prev_nondebug_insn (last)))))
5807 rtx dummy = gen_reg_rtx (SImode);
5808 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5811 do_pending_stack_adjust ();
5813 /* Find the block tail. The last insn in the block is the insn
5814 before a barrier and/or table jump insn. */
5815 last = get_last_insn ();
5816 if (BARRIER_P (last))
5817 last = PREV_INSN (last);
5818 if (JUMP_TABLE_DATA_P (last))
5819 last = PREV_INSN (PREV_INSN (last));
5820 if (BARRIER_P (last))
5821 last = PREV_INSN (last);
5822 BB_END (bb) = last;
5824 update_bb_for_insn (bb);
5826 return bb;
5830 /* Create a basic block for initialization code. */
5832 static basic_block
5833 construct_init_block (void)
5835 basic_block init_block, first_block;
5836 edge e = NULL;
5837 int flags;
5839 /* Multiple entry points not supported yet. */
5840 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5841 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5842 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5843 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5844 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5846 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5848 /* When entry edge points to first basic block, we don't need jump,
5849 otherwise we have to jump into proper target. */
5850 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5852 tree label = gimple_block_label (e->dest);
5854 emit_jump (jump_target_rtx (label));
5855 flags = 0;
5857 else
5858 flags = EDGE_FALLTHRU;
5860 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5861 get_last_insn (),
5862 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5863 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5864 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5865 if (e)
5867 first_block = e->dest;
5868 redirect_edge_succ (e, init_block);
5869 e = make_single_succ_edge (init_block, first_block, flags);
5871 else
5872 e = make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5873 EDGE_FALLTHRU);
5875 update_bb_for_insn (init_block);
5876 return init_block;
5879 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5880 found in the block tree. */
5882 static void
5883 set_block_levels (tree block, int level)
5885 while (block)
5887 BLOCK_NUMBER (block) = level;
5888 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5889 block = BLOCK_CHAIN (block);
5893 /* Create a block containing landing pads and similar stuff. */
5895 static void
5896 construct_exit_block (void)
5898 rtx_insn *head = get_last_insn ();
5899 rtx_insn *end;
5900 basic_block exit_block;
5901 edge e, e2;
5902 unsigned ix;
5903 edge_iterator ei;
5904 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5905 rtx_insn *orig_end = BB_END (prev_bb);
5907 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5909 /* Make sure the locus is set to the end of the function, so that
5910 epilogue line numbers and warnings are set properly. */
5911 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5912 input_location = cfun->function_end_locus;
5914 /* Generate rtl for function exit. */
5915 expand_function_end ();
5917 end = get_last_insn ();
5918 if (head == end)
5919 return;
5920 /* While emitting the function end we could move end of the last basic
5921 block. */
5922 BB_END (prev_bb) = orig_end;
5923 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5924 head = NEXT_INSN (head);
5925 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5926 bb count counting will be confused. Any instructions before that
5927 label are emitted for the case where PREV_BB falls through into the
5928 exit block, so append those instructions to prev_bb in that case. */
5929 if (NEXT_INSN (head) != return_label)
5931 while (NEXT_INSN (head) != return_label)
5933 if (!NOTE_P (NEXT_INSN (head)))
5934 BB_END (prev_bb) = NEXT_INSN (head);
5935 head = NEXT_INSN (head);
5938 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5939 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5940 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5942 ix = 0;
5943 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5945 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5946 if (!(e->flags & EDGE_ABNORMAL))
5947 redirect_edge_succ (e, exit_block);
5948 else
5949 ix++;
5952 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5953 EDGE_FALLTHRU);
5954 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5955 if (e2 != e)
5957 exit_block->count -= e2->count ();
5959 update_bb_for_insn (exit_block);
5962 /* Helper function for discover_nonconstant_array_refs.
5963 Look for ARRAY_REF nodes with non-constant indexes and mark them
5964 addressable. */
5966 static tree
5967 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5968 void *data ATTRIBUTE_UNUSED)
5970 tree t = *tp;
5972 if (IS_TYPE_OR_DECL_P (t))
5973 *walk_subtrees = 0;
5974 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5976 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5977 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5978 && (!TREE_OPERAND (t, 2)
5979 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5980 || (TREE_CODE (t) == COMPONENT_REF
5981 && (!TREE_OPERAND (t,2)
5982 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5983 || TREE_CODE (t) == BIT_FIELD_REF
5984 || TREE_CODE (t) == REALPART_EXPR
5985 || TREE_CODE (t) == IMAGPART_EXPR
5986 || TREE_CODE (t) == VIEW_CONVERT_EXPR
5987 || CONVERT_EXPR_P (t))
5988 t = TREE_OPERAND (t, 0);
5990 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5992 t = get_base_address (t);
5993 if (t && DECL_P (t)
5994 && DECL_MODE (t) != BLKmode)
5995 TREE_ADDRESSABLE (t) = 1;
5998 *walk_subtrees = 0;
6001 return NULL_TREE;
6004 /* RTL expansion is not able to compile array references with variable
6005 offsets for arrays stored in single register. Discover such
6006 expressions and mark variables as addressable to avoid this
6007 scenario. */
6009 static void
6010 discover_nonconstant_array_refs (void)
6012 basic_block bb;
6013 gimple_stmt_iterator gsi;
6015 FOR_EACH_BB_FN (bb, cfun)
6016 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6018 gimple *stmt = gsi_stmt (gsi);
6019 if (!is_gimple_debug (stmt))
6020 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
6024 /* This function sets crtl->args.internal_arg_pointer to a virtual
6025 register if DRAP is needed. Local register allocator will replace
6026 virtual_incoming_args_rtx with the virtual register. */
6028 static void
6029 expand_stack_alignment (void)
6031 rtx drap_rtx;
6032 unsigned int preferred_stack_boundary;
6034 if (! SUPPORTS_STACK_ALIGNMENT)
6035 return;
6037 if (cfun->calls_alloca
6038 || cfun->has_nonlocal_label
6039 || crtl->has_nonlocal_goto)
6040 crtl->need_drap = true;
6042 /* Call update_stack_boundary here again to update incoming stack
6043 boundary. It may set incoming stack alignment to a different
6044 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6045 use the minimum incoming stack alignment to check if it is OK
6046 to perform sibcall optimization since sibcall optimization will
6047 only align the outgoing stack to incoming stack boundary. */
6048 if (targetm.calls.update_stack_boundary)
6049 targetm.calls.update_stack_boundary ();
6051 /* The incoming stack frame has to be aligned at least at
6052 parm_stack_boundary. */
6053 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6055 /* Update crtl->stack_alignment_estimated and use it later to align
6056 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6057 exceptions since callgraph doesn't collect incoming stack alignment
6058 in this case. */
6059 if (cfun->can_throw_non_call_exceptions
6060 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6061 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6062 else
6063 preferred_stack_boundary = crtl->preferred_stack_boundary;
6064 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6065 crtl->stack_alignment_estimated = preferred_stack_boundary;
6066 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6067 crtl->stack_alignment_needed = preferred_stack_boundary;
6069 gcc_assert (crtl->stack_alignment_needed
6070 <= crtl->stack_alignment_estimated);
6072 crtl->stack_realign_needed
6073 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6074 crtl->stack_realign_tried = crtl->stack_realign_needed;
6076 crtl->stack_realign_processed = true;
6078 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6079 alignment. */
6080 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6081 drap_rtx = targetm.calls.get_drap_rtx ();
6083 /* stack_realign_drap and drap_rtx must match. */
6084 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6086 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6087 if (drap_rtx != NULL)
6089 crtl->args.internal_arg_pointer = drap_rtx;
6091 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6092 needed. */
6093 fixup_tail_calls ();
6098 static void
6099 expand_main_function (void)
6101 #if (defined(INVOKE__main) \
6102 || (!defined(HAS_INIT_SECTION) \
6103 && !defined(INIT_SECTION_ASM_OP) \
6104 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6105 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6106 #endif
6110 /* Expand code to initialize the stack_protect_guard. This is invoked at
6111 the beginning of a function to be protected. */
6113 static void
6114 stack_protect_prologue (void)
6116 tree guard_decl = targetm.stack_protect_guard ();
6117 rtx x, y;
6119 x = expand_normal (crtl->stack_protect_guard);
6120 if (guard_decl)
6121 y = expand_normal (guard_decl);
6122 else
6123 y = const0_rtx;
6125 /* Allow the target to copy from Y to X without leaking Y into a
6126 register. */
6127 if (targetm.have_stack_protect_set ())
6128 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6130 emit_insn (insn);
6131 return;
6134 /* Otherwise do a straight move. */
6135 emit_move_insn (x, y);
6138 /* Translate the intermediate representation contained in the CFG
6139 from GIMPLE trees to RTL.
6141 We do conversion per basic block and preserve/update the tree CFG.
6142 This implies we have to do some magic as the CFG can simultaneously
6143 consist of basic blocks containing RTL and GIMPLE trees. This can
6144 confuse the CFG hooks, so be careful to not manipulate CFG during
6145 the expansion. */
6147 namespace {
6149 const pass_data pass_data_expand =
6151 RTL_PASS, /* type */
6152 "expand", /* name */
6153 OPTGROUP_NONE, /* optinfo_flags */
6154 TV_EXPAND, /* tv_id */
6155 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6156 | PROP_gimple_lcx
6157 | PROP_gimple_lvec
6158 | PROP_gimple_lva), /* properties_required */
6159 PROP_rtl, /* properties_provided */
6160 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6161 0, /* todo_flags_start */
6162 0, /* todo_flags_finish */
6165 class pass_expand : public rtl_opt_pass
6167 public:
6168 pass_expand (gcc::context *ctxt)
6169 : rtl_opt_pass (pass_data_expand, ctxt)
6172 /* opt_pass methods: */
6173 virtual unsigned int execute (function *);
6175 }; // class pass_expand
6177 unsigned int
6178 pass_expand::execute (function *fun)
6180 basic_block bb, init_block;
6181 edge_iterator ei;
6182 edge e;
6183 rtx_insn *var_seq, *var_ret_seq;
6184 unsigned i;
6186 timevar_push (TV_OUT_OF_SSA);
6187 rewrite_out_of_ssa (&SA);
6188 timevar_pop (TV_OUT_OF_SSA);
6189 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6191 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6193 gimple_stmt_iterator gsi;
6194 FOR_EACH_BB_FN (bb, cfun)
6195 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6196 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6197 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6200 /* Make sure all values used by the optimization passes have sane
6201 defaults. */
6202 reg_renumber = 0;
6204 /* Some backends want to know that we are expanding to RTL. */
6205 currently_expanding_to_rtl = 1;
6206 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6207 free_dominance_info (CDI_DOMINATORS);
6209 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6211 insn_locations_init ();
6212 if (!DECL_IS_BUILTIN (current_function_decl))
6214 /* Eventually, all FEs should explicitly set function_start_locus. */
6215 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6216 set_curr_insn_location
6217 (DECL_SOURCE_LOCATION (current_function_decl));
6218 else
6219 set_curr_insn_location (fun->function_start_locus);
6221 else
6222 set_curr_insn_location (UNKNOWN_LOCATION);
6223 prologue_location = curr_insn_location ();
6225 #ifdef INSN_SCHEDULING
6226 init_sched_attrs ();
6227 #endif
6229 /* Make sure first insn is a note even if we don't want linenums.
6230 This makes sure the first insn will never be deleted.
6231 Also, final expects a note to appear there. */
6232 emit_note (NOTE_INSN_DELETED);
6234 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6235 discover_nonconstant_array_refs ();
6237 targetm.expand_to_rtl_hook ();
6238 crtl->init_stack_alignment ();
6239 fun->cfg->max_jumptable_ents = 0;
6241 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
6242 of the function section at exapnsion time to predict distance of calls. */
6243 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6245 /* Expand the variables recorded during gimple lowering. */
6246 timevar_push (TV_VAR_EXPAND);
6247 start_sequence ();
6249 var_ret_seq = expand_used_vars ();
6251 var_seq = get_insns ();
6252 end_sequence ();
6253 timevar_pop (TV_VAR_EXPAND);
6255 /* Honor stack protection warnings. */
6256 if (warn_stack_protect)
6258 if (fun->calls_alloca)
6259 warning (OPT_Wstack_protector,
6260 "stack protector not protecting local variables: "
6261 "variable length buffer");
6262 if (has_short_buffer && !crtl->stack_protect_guard)
6263 warning (OPT_Wstack_protector,
6264 "stack protector not protecting function: "
6265 "all local arrays are less than %d bytes long",
6266 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6269 /* Set up parameters and prepare for return, for the function. */
6270 expand_function_start (current_function_decl);
6272 /* If we emitted any instructions for setting up the variables,
6273 emit them before the FUNCTION_START note. */
6274 if (var_seq)
6276 emit_insn_before (var_seq, parm_birth_insn);
6278 /* In expand_function_end we'll insert the alloca save/restore
6279 before parm_birth_insn. We've just insertted an alloca call.
6280 Adjust the pointer to match. */
6281 parm_birth_insn = var_seq;
6284 /* Now propagate the RTL assignment of each partition to the
6285 underlying var of each SSA_NAME. */
6286 tree name;
6288 FOR_EACH_SSA_NAME (i, name, cfun)
6290 /* We might have generated new SSA names in
6291 update_alias_info_with_stack_vars. They will have a NULL
6292 defining statements, and won't be part of the partitioning,
6293 so ignore those. */
6294 if (!SSA_NAME_DEF_STMT (name))
6295 continue;
6297 adjust_one_expanded_partition_var (name);
6300 /* Clean up RTL of variables that straddle across multiple
6301 partitions, and check that the rtl of any PARM_DECLs that are not
6302 cleaned up is that of their default defs. */
6303 FOR_EACH_SSA_NAME (i, name, cfun)
6305 int part;
6307 /* We might have generated new SSA names in
6308 update_alias_info_with_stack_vars. They will have a NULL
6309 defining statements, and won't be part of the partitioning,
6310 so ignore those. */
6311 if (!SSA_NAME_DEF_STMT (name))
6312 continue;
6313 part = var_to_partition (SA.map, name);
6314 if (part == NO_PARTITION)
6315 continue;
6317 /* If this decl was marked as living in multiple places, reset
6318 this now to NULL. */
6319 tree var = SSA_NAME_VAR (name);
6320 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6321 SET_DECL_RTL (var, NULL);
6322 /* Check that the pseudos chosen by assign_parms are those of
6323 the corresponding default defs. */
6324 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6325 && (TREE_CODE (var) == PARM_DECL
6326 || TREE_CODE (var) == RESULT_DECL))
6328 rtx in = DECL_RTL_IF_SET (var);
6329 gcc_assert (in);
6330 rtx out = SA.partition_to_pseudo[part];
6331 gcc_assert (in == out);
6333 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6334 those expected by debug backends for each parm and for
6335 the result. This is particularly important for stabs,
6336 whose register elimination from parm's DECL_RTL may cause
6337 -fcompare-debug differences as SET_DECL_RTL changes reg's
6338 attrs. So, make sure the RTL already has the parm as the
6339 EXPR, so that it won't change. */
6340 SET_DECL_RTL (var, NULL_RTX);
6341 if (MEM_P (in))
6342 set_mem_attributes (in, var, true);
6343 SET_DECL_RTL (var, in);
6347 /* If this function is `main', emit a call to `__main'
6348 to run global initializers, etc. */
6349 if (DECL_NAME (current_function_decl)
6350 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6351 && DECL_FILE_SCOPE_P (current_function_decl))
6352 expand_main_function ();
6354 /* Initialize the stack_protect_guard field. This must happen after the
6355 call to __main (if any) so that the external decl is initialized. */
6356 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6357 stack_protect_prologue ();
6359 expand_phi_nodes (&SA);
6361 /* Release any stale SSA redirection data. */
6362 redirect_edge_var_map_empty ();
6364 /* Register rtl specific functions for cfg. */
6365 rtl_register_cfg_hooks ();
6367 init_block = construct_init_block ();
6369 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6370 remaining edges later. */
6371 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6372 e->flags &= ~EDGE_EXECUTABLE;
6374 /* If the function has too many markers, drop them while expanding. */
6375 if (cfun->debug_marker_count
6376 >= PARAM_VALUE (PARAM_MAX_DEBUG_MARKER_COUNT))
6377 cfun->debug_nonbind_markers = false;
6379 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6380 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6381 next_bb)
6382 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6384 if (MAY_HAVE_DEBUG_BIND_INSNS)
6385 expand_debug_locations ();
6387 if (deep_ter_debug_map)
6389 delete deep_ter_debug_map;
6390 deep_ter_debug_map = NULL;
6393 /* Free stuff we no longer need after GIMPLE optimizations. */
6394 free_dominance_info (CDI_DOMINATORS);
6395 free_dominance_info (CDI_POST_DOMINATORS);
6396 delete_tree_cfg_annotations (fun);
6398 timevar_push (TV_OUT_OF_SSA);
6399 finish_out_of_ssa (&SA);
6400 timevar_pop (TV_OUT_OF_SSA);
6402 timevar_push (TV_POST_EXPAND);
6403 /* We are no longer in SSA form. */
6404 fun->gimple_df->in_ssa_p = false;
6405 loops_state_clear (LOOP_CLOSED_SSA);
6407 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6408 conservatively to true until they are all profile aware. */
6409 delete lab_rtx_for_bb;
6410 free_histograms (fun);
6412 construct_exit_block ();
6413 insn_locations_finalize ();
6415 if (var_ret_seq)
6417 rtx_insn *after = return_label;
6418 rtx_insn *next = NEXT_INSN (after);
6419 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6420 after = next;
6421 emit_insn_after (var_ret_seq, after);
6424 /* Zap the tree EH table. */
6425 set_eh_throw_stmt_table (fun, NULL);
6427 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6428 split edges which edge insertions might do. */
6429 rebuild_jump_labels (get_insns ());
6431 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6432 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6434 edge e;
6435 edge_iterator ei;
6436 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6438 if (e->insns.r)
6440 rebuild_jump_labels_chain (e->insns.r);
6441 /* Put insns after parm birth, but before
6442 NOTE_INSNS_FUNCTION_BEG. */
6443 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6444 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6446 rtx_insn *insns = e->insns.r;
6447 e->insns.r = NULL;
6448 if (NOTE_P (parm_birth_insn)
6449 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6450 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6451 else
6452 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6454 else
6455 commit_one_edge_insertion (e);
6457 else
6458 ei_next (&ei);
6462 /* We're done expanding trees to RTL. */
6463 currently_expanding_to_rtl = 0;
6465 flush_mark_addressable_queue ();
6467 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6468 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6470 edge e;
6471 edge_iterator ei;
6472 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6474 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6475 e->flags &= ~EDGE_EXECUTABLE;
6477 /* At the moment not all abnormal edges match the RTL
6478 representation. It is safe to remove them here as
6479 find_many_sub_basic_blocks will rediscover them.
6480 In the future we should get this fixed properly. */
6481 if ((e->flags & EDGE_ABNORMAL)
6482 && !(e->flags & EDGE_SIBCALL))
6483 remove_edge (e);
6484 else
6485 ei_next (&ei);
6489 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6490 bitmap_ones (blocks);
6491 find_many_sub_basic_blocks (blocks);
6492 purge_all_dead_edges ();
6494 expand_stack_alignment ();
6496 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6497 function. */
6498 if (crtl->tail_call_emit)
6499 fixup_tail_calls ();
6501 /* After initial rtl generation, call back to finish generating
6502 exception support code. We need to do this before cleaning up
6503 the CFG as the code does not expect dead landing pads. */
6504 if (fun->eh->region_tree != NULL)
6505 finish_eh_generation ();
6507 /* BB subdivision may have created basic blocks that are are only reachable
6508 from unlikely bbs but not marked as such in the profile. */
6509 if (optimize)
6510 propagate_unlikely_bbs_forward ();
6512 /* Remove unreachable blocks, otherwise we cannot compute dominators
6513 which are needed for loop state verification. As a side-effect
6514 this also compacts blocks.
6515 ??? We cannot remove trivially dead insns here as for example
6516 the DRAP reg on i?86 is not magically live at this point.
6517 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6518 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6520 checking_verify_flow_info ();
6522 /* Initialize pseudos allocated for hard registers. */
6523 emit_initial_value_sets ();
6525 /* And finally unshare all RTL. */
6526 unshare_all_rtl ();
6528 /* There's no need to defer outputting this function any more; we
6529 know we want to output it. */
6530 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6532 /* Now that we're done expanding trees to RTL, we shouldn't have any
6533 more CONCATs anywhere. */
6534 generating_concat_p = 0;
6536 if (dump_file)
6538 fprintf (dump_file,
6539 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6540 /* And the pass manager will dump RTL for us. */
6543 /* If we're emitting a nested function, make sure its parent gets
6544 emitted as well. Doing otherwise confuses debug info. */
6546 tree parent;
6547 for (parent = DECL_CONTEXT (current_function_decl);
6548 parent != NULL_TREE;
6549 parent = get_containing_scope (parent))
6550 if (TREE_CODE (parent) == FUNCTION_DECL)
6551 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6554 TREE_ASM_WRITTEN (current_function_decl) = 1;
6556 /* After expanding, the return labels are no longer needed. */
6557 return_label = NULL;
6558 naked_return_label = NULL;
6560 /* After expanding, the tm_restart map is no longer needed. */
6561 if (fun->gimple_df->tm_restart)
6562 fun->gimple_df->tm_restart = NULL;
6564 /* Tag the blocks with a depth number so that change_scope can find
6565 the common parent easily. */
6566 set_block_levels (DECL_INITIAL (fun->decl), 0);
6567 default_rtl_profile ();
6569 /* For -dx discard loops now, otherwise IL verify in clean_state will
6570 ICE. */
6571 if (rtl_dump_and_exit)
6573 cfun->curr_properties &= ~PROP_loops;
6574 loop_optimizer_finalize ();
6577 timevar_pop (TV_POST_EXPAND);
6579 return 0;
6582 } // anon namespace
6584 rtl_opt_pass *
6585 make_pass_expand (gcc::context *ctxt)
6587 return new pass_expand (ctxt);