Add support for ARMv8-R architecture
[official-gcc.git] / gcc / cfgexpand.c
blob3b5f2fe270fda0214eb093c4defd92cd059ac1be
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2017 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "params.h"
65 #include "tree-inline.h"
66 #include "value-prof.h"
67 #include "tree-ssa-live.h"
68 #include "tree-outof-ssa.h"
69 #include "cfgloop.h"
70 #include "insn-attr.h" /* For INSN_SCHEDULING. */
71 #include "asan.h"
72 #include "tree-ssa-address.h"
73 #include "output.h"
74 #include "builtins.h"
75 #include "tree-chkp.h"
76 #include "rtl-chkp.h"
/* On some systems the way __main is used is incompatible with GCC's own
   use of it.  Such systems supply an alternative entry point through two
   macros: NAME__MAIN gives the symbol as a quoted string and SYMBOL__MAIN
   gives the same symbol without quotes.  Both must be defined, or
   neither.  When NAME__MAIN is not provided, default it here.  */
#if !defined (NAME__MAIN)
# define NAME__MAIN "__main"
#endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of comminucating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 enum gimple_rhs_class grhs_class;
109 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
111 if (grhs_class == GIMPLE_TERNARY_RHS)
112 t = build3 (gimple_assign_rhs_code (stmt),
113 TREE_TYPE (gimple_assign_lhs (stmt)),
114 gimple_assign_rhs1 (stmt),
115 gimple_assign_rhs2 (stmt),
116 gimple_assign_rhs3 (stmt));
117 else if (grhs_class == GIMPLE_BINARY_RHS)
118 t = build2 (gimple_assign_rhs_code (stmt),
119 TREE_TYPE (gimple_assign_lhs (stmt)),
120 gimple_assign_rhs1 (stmt),
121 gimple_assign_rhs2 (stmt));
122 else if (grhs_class == GIMPLE_UNARY_RHS)
123 t = build1 (gimple_assign_rhs_code (stmt),
124 TREE_TYPE (gimple_assign_lhs (stmt)),
125 gimple_assign_rhs1 (stmt));
126 else if (grhs_class == GIMPLE_SINGLE_RHS)
128 t = gimple_assign_rhs1 (stmt);
129 /* Avoid modifying this tree in place below. */
130 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
131 && gimple_location (stmt) != EXPR_LOCATION (t))
132 || (gimple_block (stmt)
133 && currently_expanding_to_rtl
134 && EXPR_P (t)))
135 t = copy_node (t);
137 else
138 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
/* STACK_ALIGNMENT_NEEDED defaults to 1 unless it has already been
   defined.  */
#ifndef STACK_ALIGNMENT_NEEDED
#define STACK_ALIGNMENT_NEEDED 1
#endif

/* For an SSA_NAME X yield SSA_NAME_VAR (X); any other tree is yielded
   unchanged.  X is evaluated more than once, so it must be free of side
   effects.  Every use of the argument is parenthesized so that an
   argument containing low-precedence operators expands as intended.  */
#define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : (x))
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 struct stack_var
310 /* The Variable. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
314 if this variable becomes it's partition's representative. */
315 HOST_WIDE_INT size;
317 /* The *byte* alignment required for this variable. Or as, with the
318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* The partition representative. */
322 size_t representative;
324 /* The next stack variable in the partition, or EOC. */
325 size_t next;
327 /* The numbers of conflicting stack variables. */
328 bitmap conflicts;
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation. */
334 static struct stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
344 is non-decreasing. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
356 /* Used during expand_used_vars. Remember if we say a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
360 /* Compute the byte alignment to use for DECL. Ignore alignment
361 we can't do with expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
369 align = TYPE_ALIGN (TREE_TYPE (decl));
370 else
372 align = LOCAL_DECL_ALIGNMENT (decl);
373 SET_DECL_ALIGN (decl, align);
375 return align / BITS_PER_UNIT;
378 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
379 down otherwise. Return truncated BASE value. */
381 static inline unsigned HOST_WIDE_INT
382 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
384 return align_up ? (base + align - 1) & -align : base & -align;
387 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
388 Return the frame offset. */
390 static HOST_WIDE_INT
391 alloc_stack_frame_space (HOST_WIDE_INT size, unsigned HOST_WIDE_INT align)
393 HOST_WIDE_INT offset, new_frame_offset;
395 if (FRAME_GROWS_DOWNWARD)
397 new_frame_offset
398 = align_base (frame_offset - frame_phase - size,
399 align, false) + frame_phase;
400 offset = new_frame_offset;
402 else
404 new_frame_offset
405 = align_base (frame_offset - frame_phase, align, true) + frame_phase;
406 offset = new_frame_offset;
407 new_frame_offset += size;
409 frame_offset = new_frame_offset;
411 if (frame_offset_overflow (frame_offset, cfun->decl))
412 frame_offset = offset = 0;
414 return offset;
417 /* Accumulate DECL into STACK_VARS. */
419 static void
420 add_stack_var (tree decl)
422 struct stack_var *v;
424 if (stack_vars_num >= stack_vars_alloc)
426 if (stack_vars_alloc)
427 stack_vars_alloc = stack_vars_alloc * 3 / 2;
428 else
429 stack_vars_alloc = 32;
430 stack_vars
431 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
433 if (!decl_to_stack_part)
434 decl_to_stack_part = new hash_map<tree, size_t>;
436 v = &stack_vars[stack_vars_num];
437 decl_to_stack_part->put (decl, stack_vars_num);
439 v->decl = decl;
440 tree size = TREE_CODE (decl) == SSA_NAME
441 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
442 : DECL_SIZE_UNIT (decl);
443 v->size = tree_to_uhwi (size);
444 /* Ensure that all variables have size, so that &a != &b for any two
445 variables that are simultaneously live. */
446 if (v->size == 0)
447 v->size = 1;
448 v->alignb = align_local_variable (decl);
449 /* An alignment of zero can mightily confuse us later. */
450 gcc_assert (v->alignb != 0);
452 /* All variables are initially in their own partition. */
453 v->representative = stack_vars_num;
454 v->next = EOC;
456 /* All variables initially conflict with no other. */
457 v->conflicts = NULL;
459 /* Ensure that this decl doesn't get put onto the list twice. */
460 set_rtl (decl, pc_rtx);
462 stack_vars_num++;
465 /* Make the decls associated with luid's X and Y conflict. */
467 static void
468 add_stack_var_conflict (size_t x, size_t y)
470 struct stack_var *a = &stack_vars[x];
471 struct stack_var *b = &stack_vars[y];
472 if (!a->conflicts)
473 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
474 if (!b->conflicts)
475 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
476 bitmap_set_bit (a->conflicts, y);
477 bitmap_set_bit (b->conflicts, x);
480 /* Check whether the decls associated with luid's X and Y conflict. */
482 static bool
483 stack_var_conflict_p (size_t x, size_t y)
485 struct stack_var *a = &stack_vars[x];
486 struct stack_var *b = &stack_vars[y];
487 if (x == y)
488 return false;
489 /* Partitions containing an SSA name result from gimple registers
490 with things like unsupported modes. They are top-level and
491 hence conflict with everything else. */
492 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
493 return true;
495 if (!a->conflicts || !b->conflicts)
496 return false;
497 return bitmap_bit_p (a->conflicts, y);
500 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
501 enter its partition number into bitmap DATA. */
503 static bool
504 visit_op (gimple *, tree op, tree, void *data)
506 bitmap active = (bitmap)data;
507 op = get_base_address (op);
508 if (op
509 && DECL_P (op)
510 && DECL_RTL_IF_SET (op) == pc_rtx)
512 size_t *v = decl_to_stack_part->get (op);
513 if (v)
514 bitmap_set_bit (active, *v);
516 return false;
519 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
520 record conflicts between it and all currently active other partitions
521 from bitmap DATA. */
523 static bool
524 visit_conflict (gimple *, tree op, tree, void *data)
526 bitmap active = (bitmap)data;
527 op = get_base_address (op);
528 if (op
529 && DECL_P (op)
530 && DECL_RTL_IF_SET (op) == pc_rtx)
532 size_t *v = decl_to_stack_part->get (op);
533 if (v && bitmap_set_bit (active, *v))
535 size_t num = *v;
536 bitmap_iterator bi;
537 unsigned i;
538 gcc_assert (num < stack_vars_num);
539 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
540 add_stack_var_conflict (num, i);
543 return false;
546 /* Helper routine for add_scope_conflicts, calculating the active partitions
547 at the end of BB, leaving the result in WORK. We're called to generate
548 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
549 liveness. */
551 static void
552 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
554 edge e;
555 edge_iterator ei;
556 gimple_stmt_iterator gsi;
557 walk_stmt_load_store_addr_fn visit;
559 bitmap_clear (work);
560 FOR_EACH_EDGE (e, ei, bb->preds)
561 bitmap_ior_into (work, (bitmap)e->src->aux);
563 visit = visit_op;
565 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
567 gimple *stmt = gsi_stmt (gsi);
568 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
570 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
572 gimple *stmt = gsi_stmt (gsi);
574 if (gimple_clobber_p (stmt))
576 tree lhs = gimple_assign_lhs (stmt);
577 size_t *v;
578 /* Nested function lowering might introduce LHSs
579 that are COMPONENT_REFs. */
580 if (!VAR_P (lhs))
581 continue;
582 if (DECL_RTL_IF_SET (lhs) == pc_rtx
583 && (v = decl_to_stack_part->get (lhs)))
584 bitmap_clear_bit (work, *v);
586 else if (!is_gimple_debug (stmt))
588 if (for_conflict
589 && visit == visit_op)
591 /* If this is the first real instruction in this BB we need
592 to add conflicts for everything live at this point now.
593 Unlike classical liveness for named objects we can't
594 rely on seeing a def/use of the names we're interested in.
595 There might merely be indirect loads/stores. We'd not add any
596 conflicts for such partitions. */
597 bitmap_iterator bi;
598 unsigned i;
599 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
601 struct stack_var *a = &stack_vars[i];
602 if (!a->conflicts)
603 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
604 bitmap_ior_into (a->conflicts, work);
606 visit = visit_conflict;
608 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
613 /* Generate stack partition conflicts between all partitions that are
614 simultaneously live. */
616 static void
617 add_scope_conflicts (void)
619 basic_block bb;
620 bool changed;
621 bitmap work = BITMAP_ALLOC (NULL);
622 int *rpo;
623 int n_bbs;
625 /* We approximate the live range of a stack variable by taking the first
626 mention of its name as starting point(s), and by the end-of-scope
627 death clobber added by gimplify as ending point(s) of the range.
628 This overapproximates in the case we for instance moved an address-taken
629 operation upward, without also moving a dereference to it upwards.
630 But it's conservatively correct as a variable never can hold values
631 before its name is mentioned at least once.
633 We then do a mostly classical bitmap liveness algorithm. */
635 FOR_ALL_BB_FN (bb, cfun)
636 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
638 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
639 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
641 changed = true;
642 while (changed)
644 int i;
645 changed = false;
646 for (i = 0; i < n_bbs; i++)
648 bitmap active;
649 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
650 active = (bitmap)bb->aux;
651 add_scope_conflicts_1 (bb, work, false);
652 if (bitmap_ior_into (active, work))
653 changed = true;
657 FOR_EACH_BB_FN (bb, cfun)
658 add_scope_conflicts_1 (bb, work, true);
660 free (rpo);
661 BITMAP_FREE (work);
662 FOR_ALL_BB_FN (bb, cfun)
663 BITMAP_FREE (bb->aux);
666 /* A subroutine of partition_stack_vars. A comparison function for qsort,
667 sorting an array of indices by the properties of the object. */
669 static int
670 stack_var_cmp (const void *a, const void *b)
672 size_t ia = *(const size_t *)a;
673 size_t ib = *(const size_t *)b;
674 unsigned int aligna = stack_vars[ia].alignb;
675 unsigned int alignb = stack_vars[ib].alignb;
676 HOST_WIDE_INT sizea = stack_vars[ia].size;
677 HOST_WIDE_INT sizeb = stack_vars[ib].size;
678 tree decla = stack_vars[ia].decl;
679 tree declb = stack_vars[ib].decl;
680 bool largea, largeb;
681 unsigned int uida, uidb;
683 /* Primary compare on "large" alignment. Large comes first. */
684 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
685 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
686 if (largea != largeb)
687 return (int)largeb - (int)largea;
689 /* Secondary compare on size, decreasing */
690 if (sizea > sizeb)
691 return -1;
692 if (sizea < sizeb)
693 return 1;
695 /* Tertiary compare on true alignment, decreasing. */
696 if (aligna < alignb)
697 return -1;
698 if (aligna > alignb)
699 return 1;
701 /* Final compare on ID for sort stability, increasing.
702 Two SSA names are compared by their version, SSA names come before
703 non-SSA names, and two normal decls are compared by their DECL_UID. */
704 if (TREE_CODE (decla) == SSA_NAME)
706 if (TREE_CODE (declb) == SSA_NAME)
707 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
708 else
709 return -1;
711 else if (TREE_CODE (declb) == SSA_NAME)
712 return 1;
713 else
714 uida = DECL_UID (decla), uidb = DECL_UID (declb);
715 if (uida < uidb)
716 return 1;
717 if (uida > uidb)
718 return -1;
719 return 0;
722 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
723 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
725 /* If the points-to solution *PI points to variables that are in a partition
726 together with other variables add all partition members to the pointed-to
727 variables bitmap. */
729 static void
730 add_partitioned_vars_to_ptset (struct pt_solution *pt,
731 part_hashmap *decls_to_partitions,
732 hash_set<bitmap> *visited, bitmap temp)
734 bitmap_iterator bi;
735 unsigned i;
736 bitmap *part;
738 if (pt->anything
739 || pt->vars == NULL
740 /* The pointed-to vars bitmap is shared, it is enough to
741 visit it once. */
742 || visited->add (pt->vars))
743 return;
745 bitmap_clear (temp);
747 /* By using a temporary bitmap to store all members of the partitions
748 we have to add we make sure to visit each of the partitions only
749 once. */
750 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
751 if ((!temp
752 || !bitmap_bit_p (temp, i))
753 && (part = decls_to_partitions->get (i)))
754 bitmap_ior_into (temp, *part);
755 if (!bitmap_empty_p (temp))
756 bitmap_ior_into (pt->vars, temp);
759 /* Update points-to sets based on partition info, so we can use them on RTL.
760 The bitmaps representing stack partitions will be saved until expand,
761 where partitioned decls used as bases in memory expressions will be
762 rewritten. */
764 static void
765 update_alias_info_with_stack_vars (void)
767 part_hashmap *decls_to_partitions = NULL;
768 size_t i, j;
769 tree var = NULL_TREE;
771 for (i = 0; i < stack_vars_num; i++)
773 bitmap part = NULL;
774 tree name;
775 struct ptr_info_def *pi;
777 /* Not interested in partitions with single variable. */
778 if (stack_vars[i].representative != i
779 || stack_vars[i].next == EOC)
780 continue;
782 if (!decls_to_partitions)
784 decls_to_partitions = new part_hashmap;
785 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
788 /* Create an SSA_NAME that points to the partition for use
789 as base during alias-oracle queries on RTL for bases that
790 have been partitioned. */
791 if (var == NULL_TREE)
792 var = create_tmp_var (ptr_type_node);
793 name = make_ssa_name (var);
795 /* Create bitmaps representing partitions. They will be used for
796 points-to sets later, so use GGC alloc. */
797 part = BITMAP_GGC_ALLOC ();
798 for (j = i; j != EOC; j = stack_vars[j].next)
800 tree decl = stack_vars[j].decl;
801 unsigned int uid = DECL_PT_UID (decl);
802 bitmap_set_bit (part, uid);
803 decls_to_partitions->put (uid, part);
804 cfun->gimple_df->decls_to_pointers->put (decl, name);
805 if (TREE_ADDRESSABLE (decl))
806 TREE_ADDRESSABLE (name) = 1;
809 /* Make the SSA name point to all partition members. */
810 pi = get_ptr_info (name);
811 pt_solution_set (&pi->pt, part, false);
814 /* Make all points-to sets that contain one member of a partition
815 contain all members of the partition. */
816 if (decls_to_partitions)
818 unsigned i;
819 tree name;
820 hash_set<bitmap> visited;
821 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
823 FOR_EACH_SSA_NAME (i, name, cfun)
825 struct ptr_info_def *pi;
827 if (POINTER_TYPE_P (TREE_TYPE (name))
828 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
829 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
830 &visited, temp);
833 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
834 decls_to_partitions, &visited, temp);
836 delete decls_to_partitions;
837 BITMAP_FREE (temp);
841 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
842 partitioning algorithm. Partitions A and B are known to be non-conflicting.
843 Merge them into a single partition A. */
845 static void
846 union_stack_vars (size_t a, size_t b)
848 struct stack_var *vb = &stack_vars[b];
849 bitmap_iterator bi;
850 unsigned u;
852 gcc_assert (stack_vars[b].next == EOC);
853 /* Add B to A's partition. */
854 stack_vars[b].next = stack_vars[a].next;
855 stack_vars[b].representative = a;
856 stack_vars[a].next = b;
858 /* Update the required alignment of partition A to account for B. */
859 if (stack_vars[a].alignb < stack_vars[b].alignb)
860 stack_vars[a].alignb = stack_vars[b].alignb;
862 /* Update the interference graph and merge the conflicts. */
863 if (vb->conflicts)
865 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
866 add_stack_var_conflict (a, stack_vars[u].representative);
867 BITMAP_FREE (vb->conflicts);
871 /* A subroutine of expand_used_vars. Binpack the variables into
872 partitions constrained by the interference graph. The overall
873 algorithm used is as follows:
875 Sort the objects by size in descending order.
876 For each object A {
877 S = size(A)
878 O = 0
879 loop {
880 Look for the largest non-conflicting object B with size <= S.
881 UNION (A, B)
886 static void
887 partition_stack_vars (void)
889 size_t si, sj, n = stack_vars_num;
891 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
892 for (si = 0; si < n; ++si)
893 stack_vars_sorted[si] = si;
895 if (n == 1)
896 return;
898 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
900 for (si = 0; si < n; ++si)
902 size_t i = stack_vars_sorted[si];
903 unsigned int ialign = stack_vars[i].alignb;
904 HOST_WIDE_INT isize = stack_vars[i].size;
906 /* Ignore objects that aren't partition representatives. If we
907 see a var that is not a partition representative, it must
908 have been merged earlier. */
909 if (stack_vars[i].representative != i)
910 continue;
912 for (sj = si + 1; sj < n; ++sj)
914 size_t j = stack_vars_sorted[sj];
915 unsigned int jalign = stack_vars[j].alignb;
916 HOST_WIDE_INT jsize = stack_vars[j].size;
918 /* Ignore objects that aren't partition representatives. */
919 if (stack_vars[j].representative != j)
920 continue;
922 /* Do not mix objects of "small" (supported) alignment
923 and "large" (unsupported) alignment. */
924 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
925 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
926 break;
928 /* For Address Sanitizer do not mix objects with different
929 sizes, as the shorter vars wouldn't be adequately protected.
930 Don't do that for "large" (unsupported) alignment objects,
931 those aren't protected anyway. */
932 if ((asan_sanitize_stack_p ())
933 && isize != jsize
934 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
935 break;
937 /* Ignore conflicting objects. */
938 if (stack_var_conflict_p (i, j))
939 continue;
941 /* UNION the objects, placing J at OFFSET. */
942 union_stack_vars (i, j);
946 update_alias_info_with_stack_vars ();
949 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
951 static void
952 dump_stack_var_partition (void)
954 size_t si, i, j, n = stack_vars_num;
956 for (si = 0; si < n; ++si)
958 i = stack_vars_sorted[si];
960 /* Skip variables that aren't partition representatives, for now. */
961 if (stack_vars[i].representative != i)
962 continue;
964 fprintf (dump_file, "Partition %lu: size " HOST_WIDE_INT_PRINT_DEC
965 " align %u\n", (unsigned long) i, stack_vars[i].size,
966 stack_vars[i].alignb);
968 for (j = i; j != EOC; j = stack_vars[j].next)
970 fputc ('\t', dump_file);
971 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
973 fputc ('\n', dump_file);
977 /* Assign rtl to DECL at BASE + OFFSET. */
979 static void
980 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
981 HOST_WIDE_INT offset)
983 unsigned align;
984 rtx x;
986 /* If this fails, we've overflowed the stack frame. Error nicely? */
987 gcc_assert (offset == trunc_int_for_mode (offset, Pmode));
989 x = plus_constant (Pmode, base, offset);
990 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
991 ? TYPE_MODE (TREE_TYPE (decl))
992 : DECL_MODE (SSAVAR (decl)), x);
994 if (TREE_CODE (decl) != SSA_NAME)
996 /* Set alignment we actually gave this decl if it isn't an SSA name.
997 If it is we generate stack slots only accidentally so it isn't as
998 important, we'll simply use the alignment that is already set. */
999 if (base == virtual_stack_vars_rtx)
1000 offset -= frame_phase;
1001 align = least_bit_hwi (offset);
1002 align *= BITS_PER_UNIT;
1003 if (align == 0 || align > base_align)
1004 align = base_align;
1006 /* One would think that we could assert that we're not decreasing
1007 alignment here, but (at least) the i386 port does exactly this
1008 via the MINIMUM_ALIGNMENT hook. */
1010 SET_DECL_ALIGN (decl, align);
1011 DECL_USER_ALIGN (decl) = 0;
1014 set_rtl (decl, x);
1017 struct stack_vars_data
1019 /* Vector of offset pairs, always end of some padding followed
1020 by start of the padding that needs Address Sanitizer protection.
1021 The vector is in reversed, highest offset pairs come first. */
1022 auto_vec<HOST_WIDE_INT> asan_vec;
1024 /* Vector of partition representative decls in between the paddings. */
1025 auto_vec<tree> asan_decl_vec;
1027 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1028 rtx asan_base;
1030 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1031 unsigned int asan_alignb;
1034 /* A subroutine of expand_used_vars. Give each partition representative
1035 a unique location within the stack frame. Update each partition member
1036 with that location. */
/* PRED, when non-NULL, filters the partition representatives handled by
this call: entries for which it returns false are left for a later call,
and entries needing "large" alignment are always left alone. With a
NULL PRED every entry that still lacks rtl is placed, "large" ones
included. DATA receives the Address Sanitizer bookkeeping (asan_vec,
asan_decl_vec, asan_alignb, asan_base), which is only touched when PRED
is non-NULL and asan_sanitize_stack_p () is true.
NOTE(review): entry 0 of stack_vars_sorted is read unconditionally, so
callers must only get here with stack_vars_num > 0. */
1038 static void
1039 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1041 size_t si, i, j, n = stack_vars_num;
1042 HOST_WIDE_INT large_size = 0, large_alloc = 0;
1043 rtx large_base = NULL;
1044 unsigned large_align = 0;
1045 bool large_allocation_done = false;
1046 tree decl;
1048 /* Determine if there are any variables requiring "large" alignment.
1049 Since these are dynamically allocated, we only process these if
1050 no predicate involved. */
1051 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1052 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1054 /* Find the total size of these variables. */
1055 for (si = 0; si < n; ++si)
1057 unsigned alignb;
1059 i = stack_vars_sorted[si];
1060 alignb = stack_vars[i].alignb;
1062 /* All "large" alignment decls come before all "small" alignment
1063 decls, but "large" alignment decls are not sorted based on
1064 their alignment. Increase large_align to track the largest
1065 required alignment. */
1066 if ((alignb * BITS_PER_UNIT) > large_align)
1067 large_align = alignb * BITS_PER_UNIT;
1069 /* Stop when we get to the first decl with "small" alignment. */
1070 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1071 break;
1073 /* Skip variables that aren't partition representatives. */
1074 if (stack_vars[i].representative != i)
1075 continue;
1077 /* Skip variables that have already had rtl assigned. See also
1078 add_stack_var where we perpetrate this pc_rtx hack. */
1079 decl = stack_vars[i].decl;
1080 if (TREE_CODE (decl) == SSA_NAME
1081 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1082 : DECL_RTL (decl) != pc_rtx)
1083 continue;
/* Round the running total up to a multiple of ALIGNB (the mask form
presumably relies on ALIGNB being a power of two), then reserve room
for this variable. */
1085 large_size += alignb - 1;
1086 large_size &= -(HOST_WIDE_INT)alignb;
1087 large_size += stack_vars[i].size;
/* Second pass: choose a base and an offset for every eligible
partition representative and propagate them to its members. */
1091 for (si = 0; si < n; ++si)
1093 rtx base;
1094 unsigned base_align, alignb;
1095 HOST_WIDE_INT offset;
1097 i = stack_vars_sorted[si];
1099 /* Skip variables that aren't partition representatives, for now. */
1100 if (stack_vars[i].representative != i)
1101 continue;
1103 /* Skip variables that have already had rtl assigned. See also
1104 add_stack_var where we perpetrate this pc_rtx hack. */
1105 decl = stack_vars[i].decl;
1106 if (TREE_CODE (decl) == SSA_NAME
1107 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1108 : DECL_RTL (decl) != pc_rtx)
1109 continue;
1111 /* Check the predicate to see whether this variable should be
1112 allocated in this pass. */
1113 if (pred && !pred (i))
1114 continue;
1116 alignb = stack_vars[i].alignb;
/* "Small" alignment: the variable is placed directly in the frame. */
1117 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1119 base = virtual_stack_vars_rtx;
/* Sanitized variables are given ASAN_RED_ZONE_SIZE extra bytes, are
aligned to at least the red zone size, and are addressed through
the asan_base pseudo rather than virtual_stack_vars_rtx. */
1120 if ((asan_sanitize_stack_p ())
1121 && pred)
1123 HOST_WIDE_INT prev_offset
1124 = align_base (frame_offset,
1125 MAX (alignb, ASAN_RED_ZONE_SIZE),
1126 !FRAME_GROWS_DOWNWARD);
1127 tree repr_decl = NULL_TREE;
1128 offset
1129 = alloc_stack_frame_space (stack_vars[i].size
1130 + ASAN_RED_ZONE_SIZE,
1131 MAX (alignb, ASAN_RED_ZONE_SIZE));
/* Record a pair of offsets for this variable: the aligned frame
offset from before the allocation and the end of the variable
proper. */
1133 data->asan_vec.safe_push (prev_offset);
1134 data->asan_vec.safe_push (offset + stack_vars[i].size);
1135 /* Find best representative of the partition.
1136 Prefer those with DECL_NAME, even better
1137 satisfying asan_protect_stack_decl predicate. */
1138 for (j = i; j != EOC; j = stack_vars[j].next)
1139 if (asan_protect_stack_decl (stack_vars[j].decl)
1140 && DECL_NAME (stack_vars[j].decl))
1142 repr_decl = stack_vars[j].decl;
1143 break;
1145 else if (repr_decl == NULL_TREE
1146 && DECL_P (stack_vars[j].decl)
1147 && DECL_NAME (stack_vars[j].decl))
1148 repr_decl = stack_vars[j].decl;
/* Fall back to the partition representative itself when no named
member was found. */
1149 if (repr_decl == NULL_TREE)
1150 repr_decl = stack_vars[i].decl;
1151 data->asan_decl_vec.safe_push (repr_decl);
1152 data->asan_alignb = MAX (data->asan_alignb, alignb);
/* The base pseudo is created lazily, on the first sanitized
variable. */
1153 if (data->asan_base == NULL)
1154 data->asan_base = gen_reg_rtx (Pmode);
1155 base = data->asan_base;
/* With STRICT_ALIGNMENT the recorded base alignment is raised to at
least GET_MODE_ALIGNMENT (SImode) << ASAN_SHADOW_SHIFT. */
1157 if (!STRICT_ALIGNMENT)
1158 base_align = crtl->max_used_stack_slot_alignment;
1159 else
1160 base_align = MAX (crtl->max_used_stack_slot_alignment,
1161 GET_MODE_ALIGNMENT (SImode)
1162 << ASAN_SHADOW_SHIFT);
1164 else
1166 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1167 base_align = crtl->max_used_stack_slot_alignment;
1170 else
1172 /* Large alignment is only processed in the last pass. */
1173 if (pred)
1174 continue;
1176 /* If there were any variables requiring "large" alignment, allocate
1177 space. */
1178 if (large_size > 0 && ! large_allocation_done)
1180 HOST_WIDE_INT loffset;
1181 rtx large_allocsize;
/* Done once per call: reserve frame space for the whole block sized
by the first loop and obtain its base from
get_dynamic_stack_base. */
1183 large_allocsize = GEN_INT (large_size);
1184 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1185 loffset = alloc_stack_frame_space
1186 (INTVAL (large_allocsize),
1187 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1188 large_base = get_dynamic_stack_base (loffset, large_align);
1189 large_allocation_done = true;
1191 gcc_assert (large_base != NULL);
/* Carve this variable out of the large block using the same
round-up-then-add arithmetic as the sizing loop above. */
1193 large_alloc += alignb - 1;
1194 large_alloc &= -(HOST_WIDE_INT)alignb;
1195 offset = large_alloc;
1196 large_alloc += stack_vars[i].size;
1198 base = large_base;
1199 base_align = large_align;
1202 /* Create rtl for each variable based on their location within the
1203 partition. */
1204 for (j = i; j != EOC; j = stack_vars[j].next)
1206 expand_one_stack_var_at (stack_vars[j].decl,
1207 base, base_align,
1208 offset);
/* Everything counted by the sizing loop must have been handed out. */
1212 gcc_assert (large_alloc == large_size);
1215 /* Take into account all sizes of partitions and reset DECL_RTLs. */
/* Returns the sum of the sizes of all partition representatives, visited
in stack_vars_sorted order. As a side effect, every member of every
partition has its rtl cleared through set_rtl (decl, NULL). */
1216 static HOST_WIDE_INT
1217 account_stack_vars (void)
1219 size_t si, j, i, n = stack_vars_num;
1220 HOST_WIDE_INT size = 0;
1222 for (si = 0; si < n; ++si)
1224 i = stack_vars_sorted[si];
1226 /* Skip variables that aren't partition representatives, for now. */
1227 if (stack_vars[i].representative != i)
1228 continue;
/* Only the representative's size is counted; the members chained
from it are walked just to reset their rtl. */
1230 size += stack_vars[i].size;
1231 for (j = i; j != EOC; j = stack_vars[j].next)
1232 set_rtl (stack_vars[j].decl, NULL);
1234 return size;
1237 /* Record the RTL assignment X for the default def of PARM. */
/* PARM must be a PARM_DECL or a RESULT_DECL. When X is non-null and not
a MEM, the alignment of PARM's type is first recorded through
record_alignment_for_reg_var. If PARM has no default definition in
the current function, X is simply attached to PARM itself. */
1239 extern void
1240 set_parm_rtl (tree parm, rtx x)
1242 gcc_assert (TREE_CODE (parm) == PARM_DECL
1243 || TREE_CODE (parm) == RESULT_DECL);
1245 if (x && !MEM_P (x))
1247 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1248 TYPE_MODE (TREE_TYPE (parm)),
1249 TYPE_ALIGN (TREE_TYPE (parm)));
1251 /* If the variable alignment is very large we'll dynamically
1252 allocate it, which means that in-frame portion is just a
1253 pointer. ??? We've got a pseudo for sure here, do we
1254 actually dynamically allocate its spilling area if needed?
1255 ??? Isn't it a problem when POINTER_SIZE also exceeds
1256 MAX_SUPPORTED_STACK_ALIGNMENT, as on cris and lm32? */
1257 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1258 align = POINTER_SIZE;
1260 record_alignment_for_reg_var (align);
/* Without a default def there is no SSA partition to update. */
1263 tree ssa = ssa_default_def (cfun, parm);
1264 if (!ssa)
1265 return set_rtl (parm, x);
1267 int part = var_to_partition (SA.map, ssa);
1268 gcc_assert (part != NO_PARTITION);
/* The partition must already be flagged in
SA.partitions_for_parm_default_defs. */
1270 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1271 gcc_assert (changed);
/* Setting the rtl of the SSA name is expected to make it visible on
PARM as well; the assertion below checks exactly that. */
1273 set_rtl (ssa, x);
1274 gcc_assert (DECL_RTL (parm) == x);
1277 /* A subroutine of expand_one_var. Called to immediately assign rtl
1278 to a variable to be allocated in the stack frame. */
/* VAR is either an SSA_NAME, whose size and alignment are taken from its
type, or a decl, whose size is DECL_SIZE_UNIT and whose alignment comes
from align_local_variable. */
1280 static void
1281 expand_one_stack_var_1 (tree var)
1283 HOST_WIDE_INT size, offset;
1284 unsigned byte_align;
1286 if (TREE_CODE (var) == SSA_NAME)
1288 tree type = TREE_TYPE (var);
1289 size = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1290 byte_align = TYPE_ALIGN_UNIT (type);
1292 else
1294 size = tree_to_uhwi (DECL_SIZE_UNIT (var));
1295 byte_align = align_local_variable (var);
1298 /* We handle highly aligned variables in expand_stack_vars. */
1299 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
/* Reserve the slot and bind VAR to it relative to
virtual_stack_vars_rtx. */
1301 offset = alloc_stack_frame_space (size, byte_align);
1303 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1304 crtl->max_used_stack_slot_alignment, offset);
1307 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1308 already assigned some MEM. */
/* For an SSA_NAME that belongs to a partition nothing is allocated here:
the partition's rtl must already exist and be a MEM. Every other VAR
is passed on to expand_one_stack_var_1. */
1310 static void
1311 expand_one_stack_var (tree var)
1313 if (TREE_CODE (var) == SSA_NAME)
1315 int part = var_to_partition (SA.map, var);
1316 if (part != NO_PARTITION)
1318 rtx x = SA.partition_to_pseudo[part];
1319 gcc_assert (x);
1320 gcc_assert (MEM_P (x));
1321 return;
1325 return expand_one_stack_var_1 (var);
1328 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1329 that will reside in a hard register. */
/* All of the work is delegated to rest_of_decl_compilation, called with
zero for both of its remaining arguments. */
1331 static void
1332 expand_one_hard_reg_var (tree var)
1334 rest_of_decl_compilation (var, 0, 0);
1337 /* Record the alignment requirements of some variable assigned to a
1338 pseudo. */
/* ALIGN is compared directly against the crtl alignment fields, each of
which is only ever raised here, never lowered. The callers in this
file pass values derived from MINIMUM_ALIGNMENT or POINTER_SIZE. */
1340 static void
1341 record_alignment_for_reg_var (unsigned int align)
1343 if (SUPPORTS_STACK_ALIGNMENT
1344 && crtl->stack_alignment_estimated < align)
1346 /* stack_alignment_estimated shouldn't change after stack
1347 realign decision made */
1348 gcc_assert (!crtl->stack_realign_processed);
1349 crtl->stack_alignment_estimated = align;
1352 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1353 So here we only make sure stack_alignment_needed >= align. */
1354 if (crtl->stack_alignment_needed < align)
1355 crtl->stack_alignment_needed = align;
1356 if (crtl->max_used_stack_slot_alignment < align)
1357 crtl->max_used_stack_slot_alignment = align;
1360 /* Create RTL for an SSA partition. */
/* VAR is an SSA name that must belong to a partition. Nothing is done
if the partition already has rtl. Otherwise the partition either gets
stack storage (deferred via add_stack_var or allocated immediately) or
a fresh pseudo in the promoted mode. */
1362 static void
1363 expand_one_ssa_partition (tree var)
1365 int part = var_to_partition (SA.map, var);
1366 gcc_assert (part != NO_PARTITION);
1368 if (SA.partition_to_pseudo[part])
1369 return;
1371 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1372 TYPE_MODE (TREE_TYPE (var)),
1373 TYPE_ALIGN (TREE_TYPE (var)));
1375 /* If the variable alignment is very large we'll dynamically allocate
1376 it, which means that in-frame portion is just a pointer. */
1377 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1378 align = POINTER_SIZE;
1380 record_alignment_for_reg_var (align);
/* Partitions that cannot live in a register go to the stack. */
1382 if (!use_register_for_decl (var))
1384 if (defer_stack_allocation (var, true))
1385 add_stack_var (var);
1386 else
1387 expand_one_stack_var_1 (var);
1388 return;
/* Register case: create a pseudo and attach it to VAR. */
1391 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1393 rtx x = gen_reg_rtx (reg_mode);
1395 set_rtl (var, x);
1398 /* Record the association between the RTL generated for partition PART
1399 and the underlying variable of the SSA_NAME VAR. */
/* A null VAR, or one that is in no partition, is ignored. The
partition's rtl must already exist; it is attached to VAR with
set_rtl. When that rtl is a REG, it is additionally marked as a user
register and/or as a pointer where applicable. */
1401 static void
1402 adjust_one_expanded_partition_var (tree var)
1404 if (!var)
1405 return;
1407 tree decl = SSA_NAME_VAR (var);
1409 int part = var_to_partition (SA.map, var);
1410 if (part == NO_PARTITION)
1411 return;
1413 rtx x = SA.partition_to_pseudo[part];
1415 gcc_assert (x);
1417 set_rtl (var, x);
/* The register annotations below do not apply to non-REG rtl. */
1419 if (!REG_P (x))
1420 return;
1422 /* Note if the object is a user variable. */
1423 if (decl && !DECL_ARTIFICIAL (decl))
1424 mark_user_reg (x);
/* The pointer test uses the type of the underlying decl when there is
one, and the type of the SSA name otherwise. */
1426 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1427 mark_reg_pointer (x, get_pointer_alignment (var));
1430 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1431 that will reside in a pseudo register. */
/* An SSA_NAME argument is only checked, not expanded: its partition must
already hold a REG, and an SSA_NAME without a partition is treated as
unreachable. For a decl, a new pseudo in the promoted mode is created
and attached with set_rtl. */
1433 static void
1434 expand_one_register_var (tree var)
1436 if (TREE_CODE (var) == SSA_NAME)
1438 int part = var_to_partition (SA.map, var);
1439 if (part != NO_PARTITION)
1441 rtx x = SA.partition_to_pseudo[part];
1442 gcc_assert (x);
1443 gcc_assert (REG_P (x));
1444 return;
1446 gcc_unreachable ();
1449 tree decl = var;
1450 tree type = TREE_TYPE (decl);
1451 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1452 rtx x = gen_reg_rtx (reg_mode);
1454 set_rtl (var, x);
1456 /* Note if the object is a user variable. */
1457 if (!DECL_ARTIFICIAL (decl))
1458 mark_user_reg (x);
/* Pointer-typed variables also record their known alignment. */
1460 if (POINTER_TYPE_P (type))
1461 mark_reg_pointer (x, get_pointer_alignment (var));
1464 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1465 has some associated error, e.g. its type is error-mark. We just need
1466 to pick something that won't crash the rest of the compiler. */
/* The placeholder depends on DECL_MODE (VAR): a BLKmode MEM at address
const0_rtx for BLKmode, const0_rtx itself for VOIDmode, and a fresh
pseudo of that mode otherwise. */
1468 static void
1469 expand_one_error_var (tree var)
1471 machine_mode mode = DECL_MODE (var);
1472 rtx x;
1474 if (mode == BLKmode)
1475 x = gen_rtx_MEM (BLKmode, const0_rtx);
1476 else if (mode == VOIDmode)
1477 x = const0_rtx;
1478 else
1479 x = gen_reg_rtx (mode);
1481 SET_DECL_RTL (var, x);
1484 /* A subroutine of expand_one_var. VAR is a variable that will be
1485 allocated to the local stack frame. Return true if we wish to
1486 add VAR to STACK_VARS so that it will be coalesced with other
1487 variables. Return false to allocate VAR immediately.
1489 This function is used to reduce the number of variables considered
1490 for coalescing, which reduces the size of the quadratic problem. */
/* VAR may be an SSA_NAME, in which case size, alignment and the
"ignored" property are taken from its type and underlying variable, or
a decl. TOPLEVEL tells whether VAR is being expanded at the outermost
level. The checks below are ordered; the first one that applies
decides the result. */
1492 static bool
1493 defer_stack_allocation (tree var, bool toplevel)
1495 tree size_unit = TREE_CODE (var) == SSA_NAME
1496 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1497 : DECL_SIZE_UNIT (var);
1499 /* Whether the variable is small enough for immediate allocation not to be
1500 a problem with regard to the frame size. */
1501 bool smallish
1502 = ((HOST_WIDE_INT) tree_to_uhwi (size_unit)
1503 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING));
1505 /* If stack protection is enabled, *all* stack variables must be deferred,
1506 so that we can re-order the strings to the top of the frame.
1507 Similarly for Address Sanitizer. */
1508 if (flag_stack_protect || asan_sanitize_stack_p ())
1509 return true;
1511 unsigned int align = TREE_CODE (var) == SSA_NAME
1512 ? TYPE_ALIGN (TREE_TYPE (var))
1513 : DECL_ALIGN (var);
1515 /* We handle "large" alignment via dynamic allocation. We want to handle
1516 this extra complication in only one place, so defer them. */
1517 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1518 return true;
/* An SSA_NAME with no underlying variable counts as ignored. */
1520 bool ignored = TREE_CODE (var) == SSA_NAME
1521 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1522 : DECL_IGNORED_P (var);
1524 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1525 might be detached from their block and appear at toplevel when we reach
1526 here. We want to coalesce them with variables from other blocks when
1527 the immediate contribution to the frame size would be noticeable. */
1528 if (toplevel && optimize > 0 && ignored && !smallish)
1529 return true;
1531 /* Variables declared in the outermost scope automatically conflict
1532 with every other variable. The only reason to want to defer them
1533 at all is that, after sorting, we can more efficiently pack
1534 small variables in the stack frame. Continue to defer at -O2. */
1535 if (toplevel && optimize < 2)
1536 return false;
1538 /* Without optimization, *most* variables are allocated from the
1539 stack, which makes the quadratic problem large exactly when we
1540 want compilation to proceed as quickly as possible. On the
1541 other hand, we don't want the function's stack frame size to
1542 get completely out of hand. So we avoid adding scalars and
1543 "small" aggregates to the list at all. */
1544 if (optimize == 0 && smallish)
1545 return false;
1547 return true;
1550 /* A subroutine of expand_used_vars. Expand one variable according to
1551 its flavor. Variables to be placed on the stack are not actually
1552 expanded yet, merely recorded.
1553 When REALLY_EXPAND is false, only add stack values to be allocated.
1554 Return stack usage this variable is supposed to take. */
/* VAR may be a decl or an SSA_NAME; the original argument is kept in
ORIGVAR while VAR is replaced by SSAVAR (var). TOPLEVEL is forwarded
to defer_stack_allocation. A non-zero size is returned only on the
immediate stack allocation path; variables deferred through
add_stack_var contribute 0 here. */
1557 static HOST_WIDE_INT
1558 expand_one_var (tree var, bool toplevel, bool really_expand)
1560 unsigned int align = BITS_PER_UNIT;
1561 tree origvar = var;
1563 var = SSAVAR (var);
1565 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
/* Global variables take no space in this function's frame. */
1567 if (is_global_var (var))
1568 return 0;
1570 /* Because we don't know if VAR will be in register or on stack,
1571 we conservatively assume it will be on stack even if VAR is
1572 eventually put into register after RA pass. For non-automatic
1573 variables, which won't be on stack, we collect alignment of
1574 type and ignore user specified alignment. Similarly for
1575 SSA_NAMEs for which use_register_for_decl returns true. */
1576 if (TREE_STATIC (var)
1577 || DECL_EXTERNAL (var)
1578 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1579 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1580 TYPE_MODE (TREE_TYPE (var)),
1581 TYPE_ALIGN (TREE_TYPE (var)));
1582 else if (DECL_HAS_VALUE_EXPR_P (var)
1583 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1584 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1585 or variables which were assigned a stack slot already by
1586 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1587 changed from the offset chosen to it. */
1588 align = crtl->stack_alignment_estimated;
1589 else
1590 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1592 /* If the variable alignment is very large we'll dynamically allocate
1593 it, which means that in-frame portion is just a pointer. */
1594 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1595 align = POINTER_SIZE;
1598 record_alignment_for_reg_var (align);
/* An SSA_NAME is only expected here for plain automatic variables and
only when really expanding. */
1600 if (TREE_CODE (origvar) == SSA_NAME)
1602 gcc_assert (!VAR_P (var)
1603 || (!DECL_EXTERNAL (var)
1604 && !DECL_HAS_VALUE_EXPR_P (var)
1605 && !TREE_STATIC (var)
1606 && TREE_TYPE (var) != error_mark_node
1607 && !DECL_HARD_REGISTER (var)
1608 && really_expand));
/* Dispatch on the flavor of VAR.
NOTE(review): no statement is visible for the first five conditions
below; presumably each selects an empty statement, i.e. nothing to
expand -- confirm. */
1610 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1612 else if (DECL_EXTERNAL (var))
1614 else if (DECL_HAS_VALUE_EXPR_P (var))
1616 else if (TREE_STATIC (var))
1618 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1620 else if (TREE_TYPE (var) == error_mark_node)
1622 if (really_expand)
1623 expand_one_error_var (var);
1625 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1627 if (really_expand)
1629 expand_one_hard_reg_var (var);
1630 if (!DECL_HARD_REGISTER (var))
1631 /* Invalid register specification. */
1632 expand_one_error_var (var);
1635 else if (use_register_for_decl (var))
1637 if (really_expand)
1638 expand_one_register_var (origvar);
1640 else if (! valid_constant_size_p (DECL_SIZE_UNIT (var)))
1642 /* Reject variables which cover more than half of the address-space. */
1643 if (really_expand)
1645 error ("size of variable %q+D is too large", var);
1646 expand_one_error_var (var);
/* Stack variables: either queue them for partitioning or allocate
them right away. */
1649 else if (defer_stack_allocation (var, toplevel))
1650 add_stack_var (origvar);
1651 else
1653 if (really_expand)
/* A function carrying the "naked" attribute gets an error for any
variable that reaches this point. */
1655 if (lookup_attribute ("naked",
1656 DECL_ATTRIBUTES (current_function_decl)))
1657 error ("cannot allocate stack for variable %q+D, naked function.",
1658 var);
1660 expand_one_stack_var (origvar);
1664 return tree_to_uhwi (DECL_SIZE_UNIT (var));
1666 return 0;
1669 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1670 expanding variables. Those variables that can be put into registers
1671 are allocated pseudos; those that can't are put on the stack.
1673 TOPLEVEL is true if this is the outermost BLOCK. */
/* Only entries with TREE_USED set are expanded, and VAR_DECLs or
RESULT_DECLs marked DECL_NONSHAREABLE are skipped. Sub-blocks are
visited recursively with TOPLEVEL false. */
1675 static void
1676 expand_used_vars_for_block (tree block, bool toplevel)
1678 tree t;
1680 /* Expand all variables at this level. */
1681 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1682 if (TREE_USED (t)
1683 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1684 || !DECL_NONSHAREABLE (t)))
1685 expand_one_var (t, toplevel, true);
1687 /* Expand all variables at containing levels. */
1688 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1689 expand_used_vars_for_block (t, false);
1692 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1693 and clear TREE_USED on all local variables. */
/* VAR_DECLs and RESULT_DECLs marked DECL_NONSHAREABLE keep their flag;
this is the same filter that expand_used_vars_for_block applies.
Sub-blocks are processed recursively. */
1695 static void
1696 clear_tree_used (tree block)
1698 tree t;
1700 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1701 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1702 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1703 || !DECL_NONSHAREABLE (t))
1704 TREE_USED (t) = 0;
1706 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1707 clear_tree_used (t);
/* Values that flag_stack_protect is compared against in this file to
select the stack protection policy. */
1710 enum {
1711 SPCT_FLAG_DEFAULT = 1,
1712 SPCT_FLAG_ALL = 2,
1713 SPCT_FLAG_STRONG = 3,
1714 SPCT_FLAG_EXPLICIT = 4
1717 /* Examine TYPE and determine a bit mask of the following features. */
/* The values are distinct single bits so that they can be OR-ed together
in the result of stack_protect_classify_type. */
1719 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1720 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1721 #define SPCT_HAS_ARRAY 4
1722 #define SPCT_HAS_AGGREGATE 8
/* Classify TYPE and return an OR of SPCT_HAS_* bits.
An array of (signed/unsigned) char is "small" when its byte size is
known and below PARAM_SSP_BUFFER_SIZE and "large" otherwise; any other
array only sets SPCT_HAS_ARRAY. Records and unions set
SPCT_HAS_AGGREGATE and add the bits of every field type, recursively.
All other types yield 0. */
1724 static unsigned int
1725 stack_protect_classify_type (tree type)
1727 unsigned int ret = 0;
1728 tree t;
1730 switch (TREE_CODE (type))
1732 case ARRAY_TYPE:
/* Compare the main variant of the element type against the three
character types. */
1733 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1734 if (t == char_type_node
1735 || t == signed_char_type_node
1736 || t == unsigned_char_type_node)
1738 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1739 unsigned HOST_WIDE_INT len;
/* A missing or unrepresentable size is treated as LEN == MAX, which
classifies the array as large below. */
1741 if (!TYPE_SIZE_UNIT (type)
1742 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1743 len = max;
1744 else
1745 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1747 if (len < max)
1748 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1749 else
1750 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1752 else
1753 ret = SPCT_HAS_ARRAY;
1754 break;
1756 case UNION_TYPE:
1757 case QUAL_UNION_TYPE:
1758 case RECORD_TYPE:
1759 ret = SPCT_HAS_AGGREGATE;
/* Only FIELD_DECL entries of the field chain contribute. */
1760 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1761 if (TREE_CODE (t) == FIELD_DECL)
1762 ret |= stack_protect_classify_type (TREE_TYPE (t));
1763 break;
1765 default:
1766 break;
1769 return ret;
1772 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1773 part of the local stack frame. Remember if we ever return nonzero for
1774 any variable in this function. The return value is the phase number in
1775 which the variable should be allocated. */
/* Side effects: has_short_buffer is set when DECL's type contains a small
character array, and has_protected_decls is set whenever the result is
nonzero. */
1777 static int
1778 stack_protect_decl_phase (tree decl)
1780 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1781 int ret = 0;
1783 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1784 has_short_buffer = true;
/* Under the ALL and STRONG policies, and under EXPLICIT when the
function carries the "stack_protect" attribute, character arrays that
are not inside an aggregate go to phase 1 and anything else containing
an array goes to phase 2. */
1786 if (flag_stack_protect == SPCT_FLAG_ALL
1787 || flag_stack_protect == SPCT_FLAG_STRONG
1788 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1789 && lookup_attribute ("stack_protect",
1790 DECL_ATTRIBUTES (current_function_decl))))
1792 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1793 && !(bits & SPCT_HAS_AGGREGATE))
1794 ret = 1;
1795 else if (bits & SPCT_HAS_ARRAY)
1796 ret = 2;
/* Otherwise only large character arrays are segregated, in phase 1. */
1798 else
1799 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1801 if (ret)
1802 has_protected_decls = true;
1804 return ret;
1807 /* Two helper routines that check for phase 1 and phase 2. These are used
1808 as callbacks for expand_stack_vars. */
/* Return true if the decl of stack variable I belongs to phase 1. */
1810 static bool
1811 stack_protect_decl_phase_1 (size_t i)
1813 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
/* Return true if the decl of stack variable I belongs to phase 2. Used
as a predicate callback for expand_stack_vars. */
1816 static bool
1817 stack_protect_decl_phase_2 (size_t i)
1819 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1822 /* And helper function that checks for asan phase (with stack protector
1823 it is phase 3). This is used as callback for expand_stack_vars.
1824 Returns true if any of the vars in the partition need to be protected. */
/* I is the index of the first stack variable to examine; the walk follows
the `next' links until EOC. */
1826 static bool
1827 asan_decl_phase_3 (size_t i)
1829 while (i != EOC)
1831 if (asan_protect_stack_decl (stack_vars[i].decl))
1832 return true;
1833 i = stack_vars[i].next;
1835 return false;
1838 /* Ensure that variables in different stack protection phases conflict
1839 so that they are not merged and share the same stack slot. */
/* The phase of every stack variable is computed once into a temporary
array, then every pair of variables with differing phases is passed to
add_stack_var_conflict. The pairwise scan is quadratic in
stack_vars_num. */
1841 static void
1842 add_stack_protection_conflicts (void)
1844 size_t i, j, n = stack_vars_num;
1845 unsigned char *phase;
1847 phase = XNEWVEC (unsigned char, n);
1848 for (i = 0; i < n; ++i)
1849 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
/* Each unordered pair is visited once, with J > I. */
1851 for (i = 0; i < n; ++i)
1853 unsigned char ph_i = phase[i];
1854 for (j = i + 1; j < n; ++j)
1855 if (ph_i != phase[j])
1856 add_stack_var_conflict (i, j);
1859 XDELETEVEC (phase);
1862 /* Create a decl for the guard at the top of the stack frame. */
/* The guard is an unnamed VAR_DECL of type ptr_type_node, marked volatile
and used. It is given a stack slot immediately through
expand_one_stack_var and then recorded in crtl->stack_protect_guard. */
1864 static void
1865 create_stack_guard (void)
1867 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1868 VAR_DECL, NULL, ptr_type_node);
1869 TREE_THIS_VOLATILE (guard) = 1;
1870 TREE_USED (guard) = 1;
1871 expand_one_stack_var (guard);
1872 crtl->stack_protect_guard = guard;
1875 /* Prepare for expanding variables. */
/* Everything set up here is torn down again by fini_vars_expansion,
except for the two stack smashing flags, which are simply reset. */
1876 static void
1877 init_vars_expansion (void)
1879 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1880 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1882 /* A map from decl to stack partition. */
1883 decl_to_stack_part = new hash_map<tree, size_t>;
1885 /* Initialize local stack smashing state. */
1886 has_protected_decls = false;
1887 has_short_buffer = false;
1890 /* Free up stack variable graph data. */
/* Releases the bitmap obstack, the stack_vars and stack_vars_sorted
arrays and the decl_to_stack_part map, and resets the associated
pointers and counters so that a later init_vars_expansion starts from
a clean state. */
1891 static void
1892 fini_vars_expansion (void)
1894 bitmap_obstack_release (&stack_var_bitmap_obstack);
1895 if (stack_vars)
1896 XDELETEVEC (stack_vars);
1897 if (stack_vars_sorted)
1898 XDELETEVEC (stack_vars_sorted);
1899 stack_vars = NULL;
1900 stack_vars_sorted = NULL;
1901 stack_vars_alloc = stack_vars_num = 0;
1902 delete decl_to_stack_part;
1903 decl_to_stack_part = NULL;
1906 /* Make a fair guess for the size of the stack frame of the function
1907 in NODE. This doesn't have to be exact, the result is only used in
1908 the inline heuristics. So we don't want to run the full stack var
1909 packing algorithm (which is quadratic in the number of stack vars).
1910 Instead, we calculate the total size of all stack vars. This turns
1911 out to be a pretty fair estimate -- packing of stack vars doesn't
1912 happen very often. */
/* The function of NODE is made current with push_cfun for the duration
of the computation and restored with pop_cfun before returning. */
1914 HOST_WIDE_INT
1915 estimated_stack_frame_size (struct cgraph_node *node)
1917 HOST_WIDE_INT size = 0;
1918 size_t i;
1919 tree var;
1920 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1922 push_cfun (fn);
1924 init_vars_expansion ();
/* Run expand_one_var with REALLY_EXPAND false on every automatic
variable of the function. It returns the size of variables that
would be allocated immediately and queues the deferred ones. */
1926 FOR_EACH_LOCAL_DECL (fn, i, var)
1927 if (auto_var_in_fn_p (var, fn->decl))
1928 size += expand_one_var (var, true, false);
/* Add the sizes of the queued variables. */
1930 if (stack_vars_num > 0)
1932 /* Fake sorting the stack vars for account_stack_vars (). */
1933 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1934 for (i = 0; i < stack_vars_num; ++i)
1935 stack_vars_sorted[i] = i;
1936 size += account_stack_vars ();
1939 fini_vars_expansion ();
1940 pop_cfun ();
1941 return size;
1944 /* Helper routine to check if a record or union contains an array field. */
/* Returns 1 if any FIELD_DECL of TREE_TYPE has an array type, or has a
record or union type that itself contains an array (checked
recursively); returns 0 otherwise. */
1946 static int
1947 record_or_union_type_has_array_p (const_tree tree_type)
1949 tree fields = TYPE_FIELDS (tree_type);
1950 tree f;
1952 for (f = fields; f; f = DECL_CHAIN (f))
1953 if (TREE_CODE (f) == FIELD_DECL)
1955 tree field_type = TREE_TYPE (f);
1956 if (RECORD_OR_UNION_TYPE_P (field_type)
1957 && record_or_union_type_has_array_p (field_type))
1958 return 1;
1959 if (TREE_CODE (field_type) == ARRAY_TYPE)
1960 return 1;
1962 return 0;
1965 /* Check if the current function has local referenced variables that
1966 have their addresses taken, contain an array, or are arrays. */
/* Global variables among the local decls are ignored, and only VAR_DECLs
can make the result true. */
1968 static bool
1969 stack_protect_decl_p ()
1971 unsigned i;
1972 tree var;
1974 FOR_EACH_LOCAL_DECL (cfun, i, var)
1975 if (!is_global_var (var))
1977 tree var_type = TREE_TYPE (var);
1978 if (VAR_P (var)
1979 && (TREE_CODE (var_type) == ARRAY_TYPE
1980 || TREE_ADDRESSABLE (var)
1981 || (RECORD_OR_UNION_TYPE_P (var_type)
1982 && record_or_union_type_has_array_p (var_type))))
1983 return true;
1985 return false;
1988 /* Check if the current function has calls that use a return slot. */
/* Every statement of every basic block is scanned. The answer is true as
soon as a non-internal call is found for which aggregate_value_p holds
on the return type of its function type. */
1990 static bool
1991 stack_protect_return_slot_p ()
1993 basic_block bb;
1995 FOR_ALL_BB_FN (bb, cfun)
1996 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1997 !gsi_end_p (gsi); gsi_next (&gsi))
1999 gimple *stmt = gsi_stmt (gsi);
2000 /* This assumes that calls to internal-only functions never
2001 use a return slot. */
2002 if (is_gimple_call (stmt)
2003 && !gimple_call_internal_p (stmt)
2004 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2005 gimple_call_fndecl (stmt)))
2006 return true;
2008 return false;
2011 /* Expand all variables used in the function. */
2013 static rtx_insn *
2014 expand_used_vars (void)
2016 tree var, outer_block = DECL_INITIAL (current_function_decl);
2017 auto_vec<tree> maybe_local_decls;
2018 rtx_insn *var_end_seq = NULL;
2019 unsigned i;
2020 unsigned len;
2021 bool gen_stack_protect_signal = false;
2023 /* Compute the phase of the stack frame for this function. */
2025 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2026 int off = STARTING_FRAME_OFFSET % align;
2027 frame_phase = off ? align - off : 0;
2030 /* Set TREE_USED on all variables in the local_decls. */
2031 FOR_EACH_LOCAL_DECL (cfun, i, var)
2032 TREE_USED (var) = 1;
2033 /* Clear TREE_USED on all variables associated with a block scope. */
2034 clear_tree_used (DECL_INITIAL (current_function_decl));
2036 init_vars_expansion ();
2038 if (targetm.use_pseudo_pic_reg ())
2039 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2041 for (i = 0; i < SA.map->num_partitions; i++)
2043 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2044 continue;
2046 tree var = partition_to_var (SA.map, i);
2048 gcc_assert (!virtual_operand_p (var));
2050 expand_one_ssa_partition (var);
2053 if (flag_stack_protect == SPCT_FLAG_STRONG)
2054 gen_stack_protect_signal
2055 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2057 /* At this point all variables on the local_decls with TREE_USED
2058 set are not associated with any block scope. Lay them out. */
2060 len = vec_safe_length (cfun->local_decls);
2061 FOR_EACH_LOCAL_DECL (cfun, i, var)
2063 bool expand_now = false;
2065 /* Expanded above already. */
2066 if (is_gimple_reg (var))
2068 TREE_USED (var) = 0;
2069 goto next;
2071 /* We didn't set a block for static or extern because it's hard
2072 to tell the difference between a global variable (re)declared
2073 in a local scope, and one that's really declared there to
2074 begin with. And it doesn't really matter much, since we're
2075 not giving them stack space. Expand them now. */
2076 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2077 expand_now = true;
2079 /* Expand variables not associated with any block now. Those created by
2080 the optimizers could be live anywhere in the function. Those that
2081 could possibly have been scoped originally and detached from their
2082 block will have their allocation deferred so we coalesce them with
2083 others when optimization is enabled. */
2084 else if (TREE_USED (var))
2085 expand_now = true;
2087 /* Finally, mark all variables on the list as used. We'll use
2088 this in a moment when we expand those associated with scopes. */
2089 TREE_USED (var) = 1;
2091 if (expand_now)
2092 expand_one_var (var, true, true);
2094 next:
2095 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2097 rtx rtl = DECL_RTL_IF_SET (var);
2099 /* Keep artificial non-ignored vars in cfun->local_decls
2100 chain until instantiate_decls. */
2101 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2102 add_local_decl (cfun, var);
2103 else if (rtl == NULL_RTX)
2104 /* If rtl isn't set yet, which can happen e.g. with
2105 -fstack-protector, retry before returning from this
2106 function. */
2107 maybe_local_decls.safe_push (var);
2111 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2113 +-----------------+-----------------+
2114 | ...processed... | ...duplicates...|
2115 +-----------------+-----------------+
2117 +-- LEN points here.
2119 We just want the duplicates, as those are the artificial
2120 non-ignored vars that we want to keep until instantiate_decls.
2121 Move them down and truncate the array. */
2122 if (!vec_safe_is_empty (cfun->local_decls))
2123 cfun->local_decls->block_remove (0, len);
2125 /* At this point, all variables within the block tree with TREE_USED
2126 set are actually used by the optimized function. Lay them out. */
2127 expand_used_vars_for_block (outer_block, true);
2129 if (stack_vars_num > 0)
2131 add_scope_conflicts ();
2133 /* If stack protection is enabled, we don't share space between
2134 vulnerable data and non-vulnerable data. */
2135 if (flag_stack_protect != 0
2136 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2137 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2138 && lookup_attribute ("stack_protect",
2139 DECL_ATTRIBUTES (current_function_decl)))))
2140 add_stack_protection_conflicts ();
2142 /* Now that we have collected all stack variables, and have computed a
2143 minimal interference graph, attempt to save some stack space. */
2144 partition_stack_vars ();
2145 if (dump_file)
2146 dump_stack_var_partition ();
2149 switch (flag_stack_protect)
2151 case SPCT_FLAG_ALL:
2152 create_stack_guard ();
2153 break;
2155 case SPCT_FLAG_STRONG:
2156 if (gen_stack_protect_signal
2157 || cfun->calls_alloca || has_protected_decls
2158 || lookup_attribute ("stack_protect",
2159 DECL_ATTRIBUTES (current_function_decl)))
2160 create_stack_guard ();
2161 break;
2163 case SPCT_FLAG_DEFAULT:
2164 if (cfun->calls_alloca || has_protected_decls
2165 || lookup_attribute ("stack_protect",
2166 DECL_ATTRIBUTES (current_function_decl)))
2167 create_stack_guard ();
2168 break;
2170 case SPCT_FLAG_EXPLICIT:
2171 if (lookup_attribute ("stack_protect",
2172 DECL_ATTRIBUTES (current_function_decl)))
2173 create_stack_guard ();
2174 break;
2175 default:
2179 /* Assign rtl to each variable based on these partitions. */
2180 if (stack_vars_num > 0)
2182 struct stack_vars_data data;
2184 data.asan_base = NULL_RTX;
2185 data.asan_alignb = 0;
2187 /* Reorder decls to be protected by iterating over the variables
2188 array multiple times, and allocating out of each phase in turn. */
2189 /* ??? We could probably integrate this into the qsort we did
2190 earlier, such that we naturally see these variables first,
2191 and thus naturally allocate things in the right order. */
2192 if (has_protected_decls)
2194 /* Phase 1 contains only character arrays. */
2195 expand_stack_vars (stack_protect_decl_phase_1, &data);
2197 /* Phase 2 contains other kinds of arrays. */
2198 if (flag_stack_protect == SPCT_FLAG_ALL
2199 || flag_stack_protect == SPCT_FLAG_STRONG
2200 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2201 && lookup_attribute ("stack_protect",
2202 DECL_ATTRIBUTES (current_function_decl))))
2203 expand_stack_vars (stack_protect_decl_phase_2, &data);
2206 if (asan_sanitize_stack_p ())
2207 /* Phase 3, any partitions that need asan protection
2208 in addition to phase 1 and 2. */
2209 expand_stack_vars (asan_decl_phase_3, &data);
2211 if (!data.asan_vec.is_empty ())
2213 HOST_WIDE_INT prev_offset = frame_offset;
2214 HOST_WIDE_INT offset, sz, redzonesz;
2215 redzonesz = ASAN_RED_ZONE_SIZE;
2216 sz = data.asan_vec[0] - prev_offset;
2217 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2218 && data.asan_alignb <= 4096
2219 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2220 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2221 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2222 offset
2223 = alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE);
2224 data.asan_vec.safe_push (prev_offset);
2225 data.asan_vec.safe_push (offset);
2226 /* Leave space for alignment if STRICT_ALIGNMENT. */
2227 if (STRICT_ALIGNMENT)
2228 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2229 << ASAN_SHADOW_SHIFT)
2230 / BITS_PER_UNIT, 1);
2232 var_end_seq
2233 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2234 data.asan_base,
2235 data.asan_alignb,
2236 data.asan_vec.address (),
2237 data.asan_decl_vec.address (),
2238 data.asan_vec.length ());
2241 expand_stack_vars (NULL, &data);
2244 fini_vars_expansion ();
2246 /* If there were any artificial non-ignored vars without rtl
2247 found earlier, see if deferred stack allocation hasn't assigned
2248 rtl to them. */
2249 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2251 rtx rtl = DECL_RTL_IF_SET (var);
2253 /* Keep artificial non-ignored vars in cfun->local_decls
2254 chain until instantiate_decls. */
2255 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2256 add_local_decl (cfun, var);
2259 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2260 if (STACK_ALIGNMENT_NEEDED)
2262 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2263 if (!FRAME_GROWS_DOWNWARD)
2264 frame_offset += align - 1;
2265 frame_offset &= -align;
2268 return var_end_seq;
2272 /* If we need to produce a detailed dump, print the tree representation
2273 for STMT to the dump file. SINCE is the last RTX after which the RTL
2274 generated for STMT should have been appended. */
2276 static void
2277 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2279 if (dump_file && (dump_flags & TDF_DETAILS))
2281 fprintf (dump_file, "\n;; ");
2282 print_gimple_stmt (dump_file, stmt, 0,
2283 TDF_SLIM | (dump_flags & TDF_LINENO));
2284 fprintf (dump_file, "\n");
2286 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2290 /* Maps the blocks that do not contain tree labels to rtx labels. */
2292 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2294 /* Returns the label_rtx expression for a label starting basic block BB. */
2296 static rtx_code_label *
2297 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2299 gimple_stmt_iterator gsi;
2300 tree lab;
2302 if (bb->flags & BB_RTL)
2303 return block_label (bb);
2305 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2306 if (elt)
2307 return *elt;
2309 /* Find the tree label if it is present. */
2311 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2313 glabel *lab_stmt;
2315 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2316 if (!lab_stmt)
2317 break;
2319 lab = gimple_label_label (lab_stmt);
2320 if (DECL_NONLOCAL (lab))
2321 break;
2323 return jump_target_rtx (lab);
2326 rtx_code_label *l = gen_label_rtx ();
2327 lab_rtx_for_bb->put (bb, l);
2328 return l;
2332 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2333 of a basic block where we just expanded the conditional at the end,
2334 possibly clean up the CFG and instruction sequence. LAST is the
2335 last instruction before the just emitted jump sequence. */
2337 static void
2338 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2340 /* Special case: when jumpif decides that the condition is
2341 trivial it emits an unconditional jump (and the necessary
2342 barrier). But we still have two edges, the fallthru one is
2343 wrong. purge_dead_edges would clean this up later. Unfortunately
2344 we have to insert insns (and split edges) before
2345 find_many_sub_basic_blocks and hence before purge_dead_edges.
2346 But splitting edges might create new blocks which depend on the
2347 fact that if there are two edges there's no barrier. So the
2348 barrier would get lost and verify_flow_info would ICE. Instead
2349 of auditing all edge splitters to care for the barrier (which
2350 normally isn't there in a cleaned CFG), fix it here. */
2351 if (BARRIER_P (get_last_insn ()))
2353 rtx_insn *insn;
2354 remove_edge (e);
2355 /* Now, we have a single successor block, if we have insns to
2356 insert on the remaining edge we potentially will insert
2357 it at the end of this block (if the dest block isn't feasible)
2358 in order to avoid splitting the edge. This insertion will take
2359 place in front of the last jump. But we might have emitted
2360 multiple jumps (conditional and one unconditional) to the
2361 same destination. Inserting in front of the last one then
2362 is a problem. See PR 40021. We fix this by deleting all
2363 jumps except the last unconditional one. */
2364 insn = PREV_INSN (get_last_insn ());
2365 /* Make sure we have an unconditional jump. Otherwise we're
2366 confused. */
2367 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2368 for (insn = PREV_INSN (insn); insn != last;)
2370 insn = PREV_INSN (insn);
2371 if (JUMP_P (NEXT_INSN (insn)))
2373 if (!any_condjump_p (NEXT_INSN (insn)))
2375 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2376 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2378 delete_insn (NEXT_INSN (insn));
2384 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2385 Returns a new basic block if we've terminated the current basic
2386 block and created a new one. */
2388 static basic_block
2389 expand_gimple_cond (basic_block bb, gcond *stmt)
2391 basic_block new_bb, dest;
2392 edge true_edge;
2393 edge false_edge;
2394 rtx_insn *last2, *last;
2395 enum tree_code code;
2396 tree op0, op1;
2398 code = gimple_cond_code (stmt);
2399 op0 = gimple_cond_lhs (stmt);
2400 op1 = gimple_cond_rhs (stmt);
2401 /* We're sometimes presented with such code:
2402 D.123_1 = x < y;
2403 if (D.123_1 != 0)
2405 This would expand to two comparisons which then later might
2406 be cleaned up by combine. But some pattern matchers like if-conversion
2407 work better when there's only one compare, so make up for this
2408 here as special exception if TER would have made the same change. */
2409 if (SA.values
2410 && TREE_CODE (op0) == SSA_NAME
2411 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2412 && TREE_CODE (op1) == INTEGER_CST
2413 && ((gimple_cond_code (stmt) == NE_EXPR
2414 && integer_zerop (op1))
2415 || (gimple_cond_code (stmt) == EQ_EXPR
2416 && integer_onep (op1)))
2417 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2419 gimple *second = SSA_NAME_DEF_STMT (op0);
2420 if (gimple_code (second) == GIMPLE_ASSIGN)
2422 enum tree_code code2 = gimple_assign_rhs_code (second);
2423 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2425 code = code2;
2426 op0 = gimple_assign_rhs1 (second);
2427 op1 = gimple_assign_rhs2 (second);
2429 /* If jumps are cheap and the target does not support conditional
2430 compare, turn some more codes into jumpy sequences. */
2431 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2432 && targetm.gen_ccmp_first == NULL)
2434 if ((code2 == BIT_AND_EXPR
2435 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2436 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2437 || code2 == TRUTH_AND_EXPR)
2439 code = TRUTH_ANDIF_EXPR;
2440 op0 = gimple_assign_rhs1 (second);
2441 op1 = gimple_assign_rhs2 (second);
2443 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2445 code = TRUTH_ORIF_EXPR;
2446 op0 = gimple_assign_rhs1 (second);
2447 op1 = gimple_assign_rhs2 (second);
2453 last2 = last = get_last_insn ();
2455 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2456 set_curr_insn_location (gimple_location (stmt));
2458 /* These flags have no purpose in RTL land. */
2459 true_edge->flags &= ~EDGE_TRUE_VALUE;
2460 false_edge->flags &= ~EDGE_FALSE_VALUE;
2462 /* We can either have a pure conditional jump with one fallthru edge or
2463 two-way jump that needs to be decomposed into two basic blocks. */
2464 if (false_edge->dest == bb->next_bb)
2466 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2467 true_edge->probability);
2468 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2469 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2470 set_curr_insn_location (true_edge->goto_locus);
2471 false_edge->flags |= EDGE_FALLTHRU;
2472 maybe_cleanup_end_of_block (false_edge, last);
2473 return NULL;
2475 if (true_edge->dest == bb->next_bb)
2477 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2478 false_edge->probability);
2479 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2480 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2481 set_curr_insn_location (false_edge->goto_locus);
2482 true_edge->flags |= EDGE_FALLTHRU;
2483 maybe_cleanup_end_of_block (true_edge, last);
2484 return NULL;
2487 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2488 true_edge->probability);
2489 last = get_last_insn ();
2490 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2491 set_curr_insn_location (false_edge->goto_locus);
2492 emit_jump (label_rtx_for_bb (false_edge->dest));
2494 BB_END (bb) = last;
2495 if (BARRIER_P (BB_END (bb)))
2496 BB_END (bb) = PREV_INSN (BB_END (bb));
2497 update_bb_for_insn (bb);
2499 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2500 dest = false_edge->dest;
2501 redirect_edge_succ (false_edge, new_bb);
2502 false_edge->flags |= EDGE_FALLTHRU;
2503 new_bb->count = false_edge->count;
2504 new_bb->frequency = EDGE_FREQUENCY (false_edge);
2505 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2506 add_bb_to_loop (new_bb, loop);
2507 if (loop->latch == bb
2508 && loop->header == dest)
2509 loop->latch = new_bb;
2510 make_single_succ_edge (new_bb, dest, 0);
2511 if (BARRIER_P (BB_END (new_bb)))
2512 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2513 update_bb_for_insn (new_bb);
2515 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2517 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2519 set_curr_insn_location (true_edge->goto_locus);
2520 true_edge->goto_locus = curr_insn_location ();
2523 return new_bb;
2526 /* Mark all calls that can have a transaction restart. */
2528 static void
2529 mark_transaction_restart_calls (gimple *stmt)
2531 struct tm_restart_node dummy;
2532 tm_restart_node **slot;
2534 if (!cfun->gimple_df->tm_restart)
2535 return;
2537 dummy.stmt = stmt;
2538 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2539 if (slot)
2541 struct tm_restart_node *n = *slot;
2542 tree list = n->label_or_list;
2543 rtx_insn *insn;
2545 for (insn = next_real_insn (get_last_insn ());
2546 !CALL_P (insn);
2547 insn = next_real_insn (insn))
2548 continue;
2550 if (TREE_CODE (list) == LABEL_DECL)
2551 add_reg_note (insn, REG_TM, label_rtx (list));
2552 else
2553 for (; list ; list = TREE_CHAIN (list))
2554 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2558 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2559 statement STMT. */
2561 static void
2562 expand_call_stmt (gcall *stmt)
2564 tree exp, decl, lhs;
2565 bool builtin_p;
2566 size_t i;
2568 if (gimple_call_internal_p (stmt))
2570 expand_internal_call (stmt);
2571 return;
2574 /* If this is a call to a built-in function and it has no effect other
2575 than setting the lhs, try to implement it using an internal function
2576 instead. */
2577 decl = gimple_call_fndecl (stmt);
2578 if (gimple_call_lhs (stmt)
2579 && !gimple_has_side_effects (stmt)
2580 && (optimize || (decl && called_as_built_in (decl))))
2582 internal_fn ifn = replacement_internal_fn (stmt);
2583 if (ifn != IFN_LAST)
2585 expand_internal_call (ifn, stmt);
2586 return;
2590 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2592 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2593 builtin_p = decl && DECL_BUILT_IN (decl);
2595 /* If this is not a builtin function, the function type through which the
2596 call is made may be different from the type of the function. */
2597 if (!builtin_p)
2598 CALL_EXPR_FN (exp)
2599 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2600 CALL_EXPR_FN (exp));
2602 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2603 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2605 for (i = 0; i < gimple_call_num_args (stmt); i++)
2607 tree arg = gimple_call_arg (stmt, i);
2608 gimple *def;
2609 /* TER addresses into arguments of builtin functions so we have a
2610 chance to infer more correct alignment information. See PR39954. */
2611 if (builtin_p
2612 && TREE_CODE (arg) == SSA_NAME
2613 && (def = get_gimple_for_ssa_name (arg))
2614 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2615 arg = gimple_assign_rhs1 (def);
2616 CALL_EXPR_ARG (exp, i) = arg;
2619 if (gimple_has_side_effects (stmt))
2620 TREE_SIDE_EFFECTS (exp) = 1;
2622 if (gimple_call_nothrow_p (stmt))
2623 TREE_NOTHROW (exp) = 1;
2625 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2626 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2627 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2628 if (decl
2629 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
2630 && (DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA
2631 || DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA_WITH_ALIGN))
2632 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2633 else
2634 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2635 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2636 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2637 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2638 CALL_WITH_BOUNDS_P (exp) = gimple_call_with_bounds_p (stmt);
2640 /* Ensure RTL is created for debug args. */
2641 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2643 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2644 unsigned int ix;
2645 tree dtemp;
2647 if (debug_args)
2648 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2650 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2651 expand_debug_expr (dtemp);
2655 lhs = gimple_call_lhs (stmt);
2656 if (lhs)
2657 expand_assignment (lhs, exp, false);
2658 else
2659 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2661 mark_transaction_restart_calls (stmt);
2665 /* Generate RTL for an asm statement (explicit assembler code).
2666 STRING is a STRING_CST node containing the assembler code text,
2667 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2668 insn is volatile; don't optimize it. */
2670 static void
2671 expand_asm_loc (tree string, int vol, location_t locus)
2673 rtx body;
2675 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2676 ggc_strdup (TREE_STRING_POINTER (string)),
2677 locus);
2679 MEM_VOLATILE_P (body) = vol;
2681 /* Non-empty basic ASM implicitly clobbers memory. */
2682 if (TREE_STRING_LENGTH (string) != 0)
2684 rtx asm_op, clob;
2685 unsigned i, nclobbers;
2686 auto_vec<rtx> input_rvec, output_rvec;
2687 auto_vec<const char *> constraints;
2688 auto_vec<rtx> clobber_rvec;
2689 HARD_REG_SET clobbered_regs;
2690 CLEAR_HARD_REG_SET (clobbered_regs);
2692 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2693 clobber_rvec.safe_push (clob);
2695 if (targetm.md_asm_adjust)
2696 targetm.md_asm_adjust (output_rvec, input_rvec,
2697 constraints, clobber_rvec,
2698 clobbered_regs);
2700 asm_op = body;
2701 nclobbers = clobber_rvec.length ();
2702 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2704 XVECEXP (body, 0, 0) = asm_op;
2705 for (i = 0; i < nclobbers; i++)
2706 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2709 emit_insn (body);
/* Count how many characters of the NUL-terminated string S are equal
   to C.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;

  for (const char *p = s; *p != '\0'; p++)
    if (*p == c)
      count++;

  return count;
}
2722 /* A subroutine of expand_asm_operands. Check that all operands have
2723 the same number of alternatives. Return true if so. */
2725 static bool
2726 check_operand_nalternatives (const vec<const char *> &constraints)
2728 unsigned len = constraints.length();
2729 if (len > 0)
2731 int nalternatives = n_occurrences (',', constraints[0]);
2733 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2735 error ("too many alternatives in %<asm%>");
2736 return false;
2739 for (unsigned i = 1; i < len; ++i)
2740 if (n_occurrences (',', constraints[i]) != nalternatives)
2742 error ("operand constraints for %<asm%> differ "
2743 "in number of alternatives");
2744 return false;
2747 return true;
2750 /* Check for overlap between registers marked in CLOBBERED_REGS and
2751 anything inappropriate in T. Emit error and return the register
2752 variable definition for error, NULL_TREE for ok. */
2754 static bool
2755 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2757 /* Conflicts between asm-declared register variables and the clobber
2758 list are not allowed. */
2759 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2761 if (overlap)
2763 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2764 DECL_NAME (overlap));
2766 /* Reset registerness to stop multiple errors emitted for a single
2767 variable. */
2768 DECL_REGISTER (overlap) = 0;
2769 return true;
2772 return false;
2775 /* Generate RTL for the GIMPLE asm statement STMT.

   A basic asm (gimple_asm_input_p) is handed straight to expand_asm_loc.
   Otherwise the operands are read from STMT: for each output and input
   operand T, the expression is TREE_VALUE (T) and the constraint string
   is TREE_VALUE (TREE_PURPOSE (T)); for each clobber T, TREE_VALUE (T)
   is a string naming what is clobbered.

   If STMT has labels (asm goto), the insn is emitted as a jump insn, and
   a label that lives in the fallthru block is replaced by a fresh label
   emitted immediately after the asm.

   Not all kinds of lvalue that may appear as outputs can be stored
   directly.  Such outputs are expanded into a temporary, and the copy
   from the temporary to the real lvalue is emitted after the asm insn.

   The insn is marked volatile when gimple_asm_volatile_p (STMT).  */
2795 static void
2796 expand_asm_stmt (gasm *stmt)
/* Scoped guard: the constructor saves input_location and sets it to
   WHERE; the destructor restores the saved value.  */
2798 class save_input_location
2800 location_t old;
2802 public:
2803 explicit save_input_location(location_t where)
2805 old = input_location;
2806 input_location = where;
2809 ~save_input_location()
2811 input_location = old;
2815 location_t locus = gimple_location (stmt);
/* Basic asm: wrap the template text in a string node and let
   expand_asm_loc emit it.  */
2817 if (gimple_asm_input_p (stmt))
2819 const char *s = gimple_asm_string (stmt);
2820 tree string = build_string (strlen (s), s);
2821 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2822 return;
2825 /* There are some legacy diagnostics in here, and also avoids a
2826 sixth parameter to targetm.md_asm_adjust. */
2827 save_input_location s_i_l(locus);
2829 unsigned noutputs = gimple_asm_noutputs (stmt);
2830 unsigned ninputs = gimple_asm_ninputs (stmt);
2831 unsigned nlabels = gimple_asm_nlabels (stmt);
2832 unsigned i;
2834 /* ??? Diagnose during gimplification? */
2835 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2837 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2838 return;
2841 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2842 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2843 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2845 /* Copy the gimple vectors into new vectors that we can manipulate. */
/* CONSTRAINTS holds the output constraints first, followed by the input
   constraints.  */
2847 output_tvec.safe_grow (noutputs);
2848 input_tvec.safe_grow (ninputs);
2849 constraints.safe_grow (noutputs + ninputs);
2851 for (i = 0; i < noutputs; ++i)
2853 tree t = gimple_asm_output_op (stmt, i);
2854 output_tvec[i] = TREE_VALUE (t);
2855 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2857 for (i = 0; i < ninputs; i++)
2859 tree t = gimple_asm_input_op (stmt, i);
2860 input_tvec[i] = TREE_VALUE (t);
2861 constraints[i + noutputs]
2862 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2865 /* ??? Diagnose during gimplification? */
2866 if (! check_operand_nalternatives (constraints))
2867 return;
2869 /* Count the number of meaningful clobbered registers, ignoring what
2870 we would ignore later. */
2871 auto_vec<rtx> clobber_rvec;
2872 HARD_REG_SET clobbered_regs;
2873 CLEAR_HARD_REG_SET (clobbered_regs);
2875 if (unsigned n = gimple_asm_nclobbers (stmt))
2877 clobber_rvec.reserve (n);
2878 for (i = 0; i < n; i++)
2880 tree t = gimple_asm_clobber_op (stmt, i);
2881 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2882 int nregs, j;
/* A negative result is a special code rather than a register number:
   -2 is diagnosed as an unknown name, -4 adds a BLKmode memory clobber,
   and -1 / -3 are accepted without adding anything.  */
2884 j = decode_reg_name_and_count (regname, &nregs);
2885 if (j < 0)
2887 if (j == -2)
2889 /* ??? Diagnose during gimplification? */
2890 error ("unknown register name %qs in %<asm%>", regname);
2892 else if (j == -4)
2894 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2895 clobber_rvec.safe_push (x);
2897 else
2899 /* Otherwise we should have -1 == empty string
2900 or -3 == cc, which is not a register. */
2901 gcc_assert (j == -1 || j == -3);
2904 else
2905 for (int reg = j; reg < j + nregs; reg++)
2907 /* Clobbering the PIC register is an error. */
2908 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2910 /* ??? Diagnose during gimplification? */
2911 error ("PIC register clobbered by %qs in %<asm%>",
2912 regname);
2913 return;
2916 SET_HARD_REG_BIT (clobbered_regs, reg);
2917 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2918 clobber_rvec.safe_push (x);
2922 unsigned nclobbers = clobber_rvec.length();
2924 /* First pass over inputs and outputs checks validity and sets
2925 mark_addressable if needed. */
2926 /* ??? Diagnose during gimplification? */
2928 for (i = 0; i < noutputs; ++i)
2930 tree val = output_tvec[i];
2931 tree type = TREE_TYPE (val);
2932 const char *constraint;
2933 bool is_inout;
2934 bool allows_reg;
2935 bool allows_mem;
2937 /* Try to parse the output constraint. If that fails, there's
2938 no point in going further. */
2939 constraint = constraints[i];
2940 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
2941 &allows_mem, &allows_reg, &is_inout))
2942 return;
2944 if (! allows_reg
2945 && (allows_mem
2946 || is_inout
2947 || (DECL_P (val)
2948 && REG_P (DECL_RTL (val))
2949 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
2950 mark_addressable (val);
2953 for (i = 0; i < ninputs; ++i)
2955 bool allows_reg, allows_mem;
2956 const char *constraint;
2958 constraint = constraints[i + noutputs];
2959 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
2960 constraints.address (),
2961 &allows_mem, &allows_reg))
2962 return;
2964 if (! allows_reg && allows_mem)
2965 mark_addressable (input_tvec[i]);
2968 /* Second pass evaluates arguments. */
2970 /* Make sure stack is consistent for asm goto. */
2971 if (nlabels > 0)
2972 do_pending_stack_adjust ();
/* generating_concat_p is cleared while operands are expanded below and
   restored from this saved value once the asm has been emitted.  */
2973 int old_generating_concat_p = generating_concat_p;
2975 /* Vector of RTX's of evaluated output operands. */
2976 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
2977 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
/* Sequence of copies from temporaries back to the real outputs; it is
   emitted after the asm insn.  */
2978 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
2980 output_rvec.safe_grow (noutputs);
2982 for (i = 0; i < noutputs; ++i)
2984 tree val = output_tvec[i];
2985 tree type = TREE_TYPE (val);
2986 bool is_inout, allows_reg, allows_mem, ok;
2987 rtx op;
/* Unlike the first pass, this parses through &constraints[i], so the
   stored constraint pointer itself may be updated by the parser.  */
2989 ok = parse_output_constraint (&constraints[i], i, ninputs,
2990 noutputs, &allows_mem, &allows_reg,
2991 &is_inout);
2992 gcc_assert (ok);
2994 /* If an output operand is not a decl or indirect ref and our constraint
2995 allows a register, make a temporary to act as an intermediate.
2996 Make the asm insn write into that, then we will copy it to
2997 the real output operand. Likewise for promoted variables. */
2999 generating_concat_p = 0;
3001 if ((TREE_CODE (val) == INDIRECT_REF
3002 && allows_mem)
3003 || (DECL_P (val)
3004 && (allows_mem || REG_P (DECL_RTL (val)))
3005 && ! (REG_P (DECL_RTL (val))
3006 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3007 || ! allows_reg
3008 || is_inout)
3010 op = expand_expr (val, NULL_RTX, VOIDmode,
3011 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3012 if (MEM_P (op))
3013 op = validize_mem (op);
3015 if (! allows_reg && !MEM_P (op))
3016 error ("output number %d not directly addressable", i);
/* A MEM where memory is not allowed, or a CONCAT, is replaced by a fresh
   pseudo; the copy back to the original location is queued in the
   after-asm sequence.  */
3017 if ((! allows_mem && MEM_P (op))
3018 || GET_CODE (op) == CONCAT)
3020 rtx old_op = op;
3021 op = gen_reg_rtx (GET_MODE (op));
3023 generating_concat_p = old_generating_concat_p;
3025 if (is_inout)
3026 emit_move_insn (op, old_op);
3028 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3029 emit_move_insn (old_op, op);
3030 after_rtl_seq = get_insns ();
3031 after_rtl_end = get_last_insn ();
3032 end_sequence ();
3035 else
3037 op = assign_temp (type, 0, 1);
3038 op = validize_mem (op);
3039 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3040 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3042 generating_concat_p = old_generating_concat_p;
3044 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3045 expand_assignment (val, make_tree (type, op), false);
3046 after_rtl_seq = get_insns ();
3047 after_rtl_end = get_last_insn ();
3048 end_sequence ();
3050 output_rvec[i] = op;
3052 if (is_inout)
3053 inout_opnum.safe_push (i);
3056 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3057 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3059 input_rvec.safe_grow (ninputs);
3060 input_mode.safe_grow (ninputs);
3062 generating_concat_p = 0;
3064 for (i = 0; i < ninputs; ++i)
3066 tree val = input_tvec[i];
3067 tree type = TREE_TYPE (val);
3068 bool allows_reg, allows_mem, ok;
3069 const char *constraint;
3070 rtx op;
3072 constraint = constraints[i + noutputs];
3073 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3074 constraints.address (),
3075 &allows_mem, &allows_reg);
3076 gcc_assert (ok);
3078 /* EXPAND_INITIALIZER will not generate code for valid initializer
3079 constants, but will still generate code for other types of operand.
3080 This is the behavior we want for constant constraints. */
3081 op = expand_expr (val, NULL_RTX, VOIDmode,
3082 allows_reg ? EXPAND_NORMAL
3083 : allows_mem ? EXPAND_MEMORY
3084 : EXPAND_INITIALIZER);
3086 /* Never pass a CONCAT to an ASM. */
3087 if (GET_CODE (op) == CONCAT)
3088 op = force_reg (GET_MODE (op), op);
3089 else if (MEM_P (op))
3090 op = validize_mem (op);
3092 if (asm_operand_ok (op, constraint, NULL) <= 0)
3094 if (allows_reg && TYPE_MODE (type) != BLKmode)
3095 op = force_reg (TYPE_MODE (type), op);
3096 else if (!allows_mem)
3097 warning (0, "asm operand %d probably doesn%'t match constraints",
3098 i + noutputs);
3099 else if (MEM_P (op))
3101 /* We won't recognize either volatile memory or memory
3102 with a queued address as available a memory_operand
3103 at this point. Ignore it: clearly this *is* a memory. */
3105 else
3106 gcc_unreachable ();
3108 input_rvec[i] = op;
3109 input_mode[i] = TYPE_MODE (type);
3112 /* For in-out operands, copy output rtx to input rtx. */
/* Each in-out output is appended as an extra input whose constraint is
   the decimal number of the output operand it is tied to.  */
3113 unsigned ninout = inout_opnum.length();
3114 for (i = 0; i < ninout; i++)
3116 int j = inout_opnum[i];
3117 rtx o = output_rvec[j];
3119 input_rvec.safe_push (o);
3120 input_mode.safe_push (GET_MODE (o));
3122 char buffer[16];
3123 sprintf (buffer, "%d", j);
3124 constraints.safe_push (ggc_strdup (buffer));
3126 ninputs += ninout;
3128 /* Sometimes we wish to automatically clobber registers across an asm.
3129 Case in point is when the i386 backend moved from cc0 to a hard reg --
3130 maintaining source-level compatibility means automatically clobbering
3131 the flags register. */
3132 rtx_insn *after_md_seq = NULL;
3133 if (targetm.md_asm_adjust)
3134 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3135 constraints, clobber_rvec,
3136 clobbered_regs);
3138 /* Do not allow the hook to change the output and input count,
3139 lest it mess up the operand numbering. */
3140 gcc_assert (output_rvec.length() == noutputs);
3141 gcc_assert (input_rvec.length() == ninputs);
3142 gcc_assert (constraints.length() == noutputs + ninputs);
3144 /* But it certainly can adjust the clobbers. */
3145 nclobbers = clobber_rvec.length();
3147 /* Third pass checks for easy conflicts. */
3148 /* ??? Why are we doing this on trees instead of rtx. */
3150 bool clobber_conflict_found = 0;
3151 for (i = 0; i < noutputs; ++i)
3152 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3153 clobber_conflict_found = 1;
/* NINPUTS now counts the in-out copies appended above; only the first
   NINPUTS - NINOUT inputs have a tree in INPUT_TVEC.  */
3154 for (i = 0; i < ninputs - ninout; ++i)
3155 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3156 clobber_conflict_found = 1;
3158 /* Make vectors for the expression-rtx, constraint strings,
3159 and named operands. */
3161 rtvec argvec = rtvec_alloc (ninputs);
3162 rtvec constraintvec = rtvec_alloc (ninputs);
3163 rtvec labelvec = rtvec_alloc (nlabels);
3165 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3166 : GET_MODE (output_rvec[0])),
3167 ggc_strdup (gimple_asm_string (stmt)),
3168 "", 0, argvec, constraintvec,
3169 labelvec, locus);
3170 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3172 for (i = 0; i < ninputs; ++i)
3174 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3175 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3176 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3177 constraints[i + noutputs],
3178 locus);
3181 /* Copy labels to the vector. */
3182 rtx_code_label *fallthru_label = NULL;
3183 if (nlabels > 0)
3185 basic_block fallthru_bb = NULL;
3186 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3187 if (fallthru)
3188 fallthru_bb = fallthru->dest;
3190 for (i = 0; i < nlabels; ++i)
3192 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3193 rtx_insn *r;
3194 /* If asm goto has any labels in the fallthru basic block, use
3195 a label that we emit immediately after the asm goto. Expansion
3196 may insert further instructions into the same basic block after
3197 asm goto and if we don't do this, insertion of instructions on
3198 the fallthru edge might misbehave. See PR58670. */
3199 if (fallthru_bb && label_to_block_fn (cfun, label) == fallthru_bb)
3201 if (fallthru_label == NULL_RTX)
3202 fallthru_label = gen_label_rtx ();
3203 r = fallthru_label;
3205 else
3206 r = label_rtx (label);
3207 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3211 /* Now, for each output, construct an rtx
3212 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3213 ARGVEC CONSTRAINTS OPNAMES))
3214 If there is more than one, put them inside a PARALLEL. */
3216 if (nlabels > 0 && nclobbers == 0)
3218 gcc_assert (noutputs == 0);
3219 emit_jump_insn (body);
3221 else if (noutputs == 0 && nclobbers == 0)
3223 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3224 emit_insn (body);
3226 else if (noutputs == 1 && nclobbers == 0)
3228 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3229 emit_insn (gen_rtx_SET (output_rvec[0], body));
3231 else
3233 rtx obody = body;
3234 int num = noutputs;
3236 if (num == 0)
3237 num = 1;
3239 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3241 /* For each output operand, store a SET. */
3242 for (i = 0; i < noutputs; ++i)
3244 rtx src, o = output_rvec[i];
3245 if (i == 0)
3247 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3248 src = obody;
3250 else
3252 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3253 ASM_OPERANDS_TEMPLATE (obody),
3254 constraints[i], i, argvec,
3255 constraintvec, labelvec, locus);
3256 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3258 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3261 /* If there are no outputs (but there are some clobbers)
3262 store the bare ASM_OPERANDS into the PARALLEL. */
3263 if (i == 0)
3264 XVECEXP (body, 0, i++) = obody;
3266 /* Store (clobber REG) for each clobbered register specified. */
3267 for (unsigned j = 0; j < nclobbers; ++j)
3269 rtx clobbered_reg = clobber_rvec[j];
3271 /* Do sanity check for overlap between clobbers and respectively
3272 input and outputs that hasn't been handled. Such overlap
3273 should have been detected and reported above. */
3274 if (!clobber_conflict_found && REG_P (clobbered_reg))
3276 /* We test the expanded operand vectors (output_rvec and
3277 input_rvec) rather than the under-construction body. */
3278 for (unsigned k = 0; k < noutputs; ++k)
3279 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3280 internal_error ("asm clobber conflict with output operand");
3282 for (unsigned k = 0; k < ninputs - ninout; ++k)
3283 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3284 internal_error ("asm clobber conflict with input operand");
3287 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3290 if (nlabels > 0)
3291 emit_jump_insn (body);
3292 else
3293 emit_insn (body);
3296 generating_concat_p = old_generating_concat_p;
/* Emission order after the asm insn: the fallthru label (if one was
   created), then the target hook's sequence, then the copies back to
   the real output operands.  */
3298 if (fallthru_label)
3299 emit_label (fallthru_label);
3301 if (after_md_seq)
3302 emit_insn (after_md_seq);
3303 if (after_rtl_seq)
3304 emit_insn (after_rtl_seq);
3306 free_temp_slots ();
3307 crtl->has_asm_statement = 1;
3310 /* Emit code to jump to the address
3311 specified by the pointer expression EXP. */
3313 static void
3314 expand_computed_goto (tree exp)
3316 rtx x = expand_normal (exp);
3318 do_pending_stack_adjust ();
3319 emit_indirect_jump (x);
3322 /* Generate RTL code for a `goto' statement with target label LABEL.
3323 LABEL should be a LABEL_DECL tree node that was or will later be
3324 defined with `expand_label'. */
3326 static void
3327 expand_goto (tree label)
3329 if (flag_checking)
3331 /* Check for a nonlocal goto to a containing function. Should have
3332 gotten translated to __builtin_nonlocal_goto. */
3333 tree context = decl_function_context (label);
3334 gcc_assert (!context || context == current_function_decl);
3337 emit_jump (jump_target_rtx (label));
3340 /* Output a return with no value. */
3342 static void
3343 expand_null_return_1 (void)
3345 clear_pending_stack_adjust ();
3346 do_pending_stack_adjust ();
3347 emit_jump (return_label);
3350 /* Generate RTL to return from the current function, with no value.
3351 (That is, we do not do anything about returning any value.) */
3353 void
3354 expand_null_return (void)
3356 /* If this function was declared to return a value, but we
3357 didn't, clobber the return registers so that they are not
3358 propagated live to the rest of the function. */
3359 clobber_return_register ();
3361 expand_null_return_1 ();
3364 /* Generate RTL to return from the current function, with value VAL. */
3366 static void
3367 expand_value_return (rtx val)
3369 /* Copy the value to the return location unless it's already there. */
3371 tree decl = DECL_RESULT (current_function_decl);
3372 rtx return_reg = DECL_RTL (decl);
3373 if (return_reg != val)
3375 tree funtype = TREE_TYPE (current_function_decl);
3376 tree type = TREE_TYPE (decl);
3377 int unsignedp = TYPE_UNSIGNED (type);
3378 machine_mode old_mode = DECL_MODE (decl);
3379 machine_mode mode;
3380 if (DECL_BY_REFERENCE (decl))
3381 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3382 else
3383 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3385 if (mode != old_mode)
3386 val = convert_modes (mode, old_mode, val, unsignedp);
3388 if (GET_CODE (return_reg) == PARALLEL)
3389 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3390 else
3391 emit_move_insn (return_reg, val);
3394 expand_null_return_1 ();
3397 /* Generate RTL to evaluate the expression RETVAL and return it
3398 from the current function.
   BOUNDS is only consulted when the result decl has DECL_BOUNDS_RTL
   set: if it is non-null and not error_mark_node it is expanded and
   stored as the returned bounds; otherwise zero bounds (BOUNDS ==
   error_mark_node) or bounds loaded from the address of the returned
   value (BOUNDS == NULL) are stored instead.  */
3400 static void
3401 expand_return (tree retval, tree bounds)
3403 rtx result_rtl;
3404 rtx val = 0;
3405 tree retval_rhs;
3406 rtx bounds_rtl;
3408 /* If function wants no value, give it none. */
3409 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
/* RETVAL is still expanded (its result is discarded) before the
   valueless return is emitted.  */
3411 expand_normal (retval);
3412 expand_null_return ();
3413 return;
3416 if (retval == error_mark_node)
3418 /* Treat this like a return of no value from a function that
3419 returns a value. */
3420 expand_null_return ();
3421 return;
/* For an assignment (MODIFY_EXPR or INIT_EXPR) whose destination is a
   RESULT_DECL, only the right-hand side is of interest below.  */
3423 else if ((TREE_CODE (retval) == MODIFY_EXPR
3424 || TREE_CODE (retval) == INIT_EXPR)
3425 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3426 retval_rhs = TREE_OPERAND (retval, 1);
3427 else
3428 retval_rhs = retval;
3430 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3432 /* Put returned bounds to the right place. */
3433 bounds_rtl = DECL_BOUNDS_RTL (DECL_RESULT (current_function_decl));
3434 if (bounds_rtl)
3436 rtx addr = NULL;
3437 rtx bnd = NULL;
/* Case 1: usable BOUNDS were supplied; expand and store them.  */
3439 if (bounds && bounds != error_mark_node)
3441 bnd = expand_normal (bounds);
3442 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Case 2: bounds are returned in a single register.  At this point
   BOUNDS is either NULL or error_mark_node.  */
3444 else if (REG_P (bounds_rtl))
3446 if (bounds)
3447 bnd = chkp_expand_zero_bounds ();
3448 else
/* No BOUNDS at all: load them from a Pmode MEM built on the address
   of the returned expression.  */
3450 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3451 addr = gen_rtx_MEM (Pmode, addr);
3452 bnd = targetm.calls.load_bounds_for_arg (addr, NULL, NULL);
3455 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Case 3: bounds are returned in several places, described by a
   PARALLEL.  */
3457 else
3459 int n;
3461 gcc_assert (GET_CODE (bounds_rtl) == PARALLEL);
3463 if (bounds)
3464 bnd = chkp_expand_zero_bounds ();
3465 else
3467 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3468 addr = gen_rtx_MEM (Pmode, addr);
/* Each element of the PARALLEL supplies the destination slot as its
   operand 0 and, when bounds must be loaded, a constant offset into
   ADDR as its operand 1.  */
3471 for (n = 0; n < XVECLEN (bounds_rtl, 0); n++)
3473 rtx slot = XEXP (XVECEXP (bounds_rtl, 0, n), 0);
3474 if (!bounds)
3476 rtx offs = XEXP (XVECEXP (bounds_rtl, 0, n), 1);
3477 rtx from = adjust_address (addr, Pmode, INTVAL (offs));
3478 bnd = targetm.calls.load_bounds_for_arg (from, NULL, NULL);
3480 targetm.calls.store_returned_bounds (slot, bnd);
/* No bounds RTL on the result decl.  In an instrumented function, if
   the returned expression is not BOUNDED_P, has a type containing
   pointers and is not the RESULT_DECL itself, copy its bounds to the
   result location, which is asserted to be a MEM.  */
3484 else if (chkp_function_instrumented_p (current_function_decl)
3485 && !BOUNDED_P (retval_rhs)
3486 && chkp_type_has_pointer (TREE_TYPE (retval_rhs))
3487 && TREE_CODE (retval_rhs) != RESULT_DECL)
3489 rtx addr = expand_normal (build_fold_addr_expr (retval_rhs));
3490 addr = gen_rtx_MEM (Pmode, addr);
3492 gcc_assert (MEM_P (result_rtl));
3494 chkp_copy_bounds_for_stack_parm (result_rtl, addr, TREE_TYPE (retval_rhs));
3497 /* If we are returning the RESULT_DECL, then the value has already
3498 been stored into it, so we don't have to do anything special. */
3499 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3500 expand_value_return (result_rtl);
3502 /* If the result is an aggregate that is being returned in one (or more)
3503 registers, load the registers here. */
3505 else if (retval_rhs != 0
3506 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3507 && REG_P (result_rtl))
3509 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3510 if (val)
3512 /* Use the mode of the result value on the return register. */
3513 PUT_MODE (result_rtl, GET_MODE (val));
3514 expand_value_return (val);
/* copy_blkmode_to_reg produced nothing: return without a value.  */
3516 else
3517 expand_null_return ();
/* Non-void value returned in a register or a PARALLEL: compute it
   into a temporary, make sure it is not a MEM, then return it.  */
3519 else if (retval_rhs != 0
3520 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3521 && (REG_P (result_rtl)
3522 || (GET_CODE (result_rtl) == PARALLEL)))
3524 /* Compute the return value into a temporary (usually a pseudo reg). */
3526 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3527 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3528 val = force_not_mem (val);
3529 expand_value_return (val);
3531 else
3533 /* No hard reg used; calculate value into hard return reg. */
/* The whole RETVAL (including any assignment to the RESULT_DECL) is
   expanded for its side effects, with const0_rtx as the target.  */
3534 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3535 expand_value_return (result_rtl);
3539 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3540 STMT that doesn't require special handling for outgoing edges. That
3541 is no tailcalls and no GIMPLE_COND.
   Dispatches on gimple_code (STMT); any statement code not listed in
   the switch reaches gcc_unreachable.  */
3543 static void
3544 expand_gimple_stmt_1 (gimple *stmt)
3546 tree op0;
/* Insns emitted from here on carry the statement's location.  */
3548 set_curr_insn_location (gimple_location (stmt));
3550 switch (gimple_code (stmt))
/* Goto: a LABEL_DECL destination is a direct jump, anything else is
   treated as a computed goto.  */
3552 case GIMPLE_GOTO:
3553 op0 = gimple_goto_dest (stmt);
3554 if (TREE_CODE (op0) == LABEL_DECL)
3555 expand_goto (op0);
3556 else
3557 expand_computed_goto (op0);
3558 break;
3559 case GIMPLE_LABEL:
3560 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3561 break;
/* Nothing is emitted for NOP and PREDICT statements.  */
3562 case GIMPLE_NOP:
3563 case GIMPLE_PREDICT:
3564 break;
/* Switch: with exactly one label the statement degenerates to a jump
   to the default label; otherwise expand_case handles it.  */
3565 case GIMPLE_SWITCH:
3567 gswitch *swtch = as_a <gswitch *> (stmt);
3568 if (gimple_switch_num_labels (swtch) == 1)
3569 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3570 else
3571 expand_case (swtch);
3573 break;
3574 case GIMPLE_ASM:
3575 expand_asm_stmt (as_a <gasm *> (stmt));
3576 break;
3577 case GIMPLE_CALL:
3578 expand_call_stmt (as_a <gcall *> (stmt));
3579 break;
/* Return: OP0 is the returned value (may be null), BND the returned
   bounds (may be null).  */
3581 case GIMPLE_RETURN:
3583 tree bnd = gimple_return_retbnd (as_a <greturn *> (stmt));
3584 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3586 if (op0 && op0 != error_mark_node)
3588 tree result = DECL_RESULT (current_function_decl);
3590 /* Mark we have return statement with missing bounds. */
3591 if (!bnd
3592 && chkp_function_instrumented_p (cfun->decl)
3593 && !DECL_P (op0))
3594 bnd = error_mark_node;
3596 /* If we are not returning the current function's RESULT_DECL,
3597 build an assignment to it. */
3598 if (op0 != result)
3600 /* I believe that a function's RESULT_DECL is unique. */
3601 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3603 /* ??? We'd like to use simply expand_assignment here,
3604 but this fails if the value is of BLKmode but the return
3605 decl is a register. expand_return has special handling
3606 for this combination, which eventually should move
3607 to common code. See comments there. Until then, let's
3608 build a modify expression :-/ */
3609 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3610 result, op0);
/* A null OP0 means a plain `return;'.  An error_mark_node OP0 is
   passed on to expand_return unchanged.  */
3614 if (!op0)
3615 expand_null_return ();
3616 else
3617 expand_return (op0, bnd);
3619 break;
3621 case GIMPLE_ASSIGN:
3623 gassign *assign_stmt = as_a <gassign *> (stmt);
3624 tree lhs = gimple_assign_lhs (assign_stmt);
3626 /* Tree expand used to fiddle with |= and &= of two bitfield
3627 COMPONENT_REFs here. This can't happen with gimple, the LHS
3628 of binary assigns must be a gimple reg. */
/* First path: the LHS is not an SSA name, or the RHS is a single
   operand.  The assert below checks that in both situations the RHS
   class is GIMPLE_SINGLE_RHS.  */
3630 if (TREE_CODE (lhs) != SSA_NAME
3631 || get_gimple_rhs_class (gimple_expr_code (stmt))
3632 == GIMPLE_SINGLE_RHS)
3634 tree rhs = gimple_assign_rhs1 (assign_stmt);
3635 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3636 == GIMPLE_SINGLE_RHS);
3637 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3638 /* Do not put locations on possibly shared trees. */
3639 && !is_gimple_min_invariant (rhs))
3640 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3641 if (TREE_CLOBBER_P (rhs))
3642 /* This is a clobber to mark the going out of scope for
3643 this LHS. */
3645 else
3646 expand_assignment (lhs, rhs,
3647 gimple_assign_nontemporal_move_p (
3648 assign_stmt));
/* Second path: SSA-name LHS with a unary, binary or ternary RHS.
   The operation is described in OPS and handed to
   expand_expr_real_2.  */
3650 else
3652 rtx target, temp;
3653 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3654 struct separate_ops ops;
3655 bool promoted = false;
3657 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3658 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3659 promoted = true;
3661 ops.code = gimple_assign_rhs_code (assign_stmt);
3662 ops.type = TREE_TYPE (lhs);
/* The cases fall through deliberately so that a ternary RHS fills
   op2, op1 and op0, a binary RHS op1 and op0, and a unary RHS only
   op0.  */
3663 switch (get_gimple_rhs_class (ops.code))
3665 case GIMPLE_TERNARY_RHS:
3666 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3667 /* Fallthru */
3668 case GIMPLE_BINARY_RHS:
3669 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3670 /* Fallthru */
3671 case GIMPLE_UNARY_RHS:
3672 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3673 break;
3674 default:
3675 gcc_unreachable ();
3677 ops.location = gimple_location (stmt);
3679 /* If we want to use a nontemporal store, force the value to
3680 register first. If we store into a promoted register,
3681 don't directly expand to target. */
3682 temp = nontemporal || promoted ? NULL_RTX : target;
3683 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3684 EXPAND_NORMAL);
/* Store TEMP into TARGET.  The conditions are tried in order: TEMP
   is already TARGET; TARGET is a promoted SUBREG; a nontemporal
   store insn could be emitted; otherwise an ordinary move.  */
3686 if (temp == target)
3688 else if (promoted)
3690 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3691 /* If TEMP is a VOIDmode constant, use convert_modes to make
3692 sure that we properly convert it. */
3693 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3695 temp = convert_modes (GET_MODE (target),
3696 TYPE_MODE (ops.type),
3697 temp, unsignedp);
3698 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3699 GET_MODE (target), temp, unsignedp);
/* The value is written to the register underlying the SUBREG.  */
3702 convert_move (SUBREG_REG (target), temp, unsignedp);
3704 else if (nontemporal && emit_storent_insn (target, temp))
3706 else
3708 temp = force_operand (temp, target);
3709 if (temp != target)
3710 emit_move_insn (target, temp);
3714 break;
3716 default:
3717 gcc_unreachable ();
3721 /* Expand one gimple statement STMT and return the last RTL instruction
3722 before any of the newly generated ones.
3724 In addition to generating the necessary RTL instructions this also
3725 sets REG_EH_REGION notes if necessary and sets the current source
3726 location for diagnostics. */
3728 static rtx_insn *
3729 expand_gimple_stmt (gimple *stmt)
3731 location_t saved_location = input_location;
3732 rtx_insn *last = get_last_insn ();
3733 int lp_nr;
3735 gcc_assert (cfun);
3737 /* We need to save and restore the current source location so that errors
3738 discovered during expansion are emitted with the right location. But
3739 it would be better if the diagnostic routines used the source location
3740 embedded in the tree nodes rather than globals. */
3741 if (gimple_has_location (stmt))
3742 input_location = gimple_location (stmt);
3744 expand_gimple_stmt_1 (stmt);
3746 /* Free any temporaries used to evaluate this statement. */
3747 free_temp_slots ();
3749 input_location = saved_location;
3751 /* Mark all insns that may trap. */
3752 lp_nr = lookup_stmt_eh_lp (stmt);
3753 if (lp_nr)
3755 rtx_insn *insn;
3756 for (insn = next_real_insn (last); insn;
3757 insn = next_real_insn (insn))
3759 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3760 /* If we want exceptions for non-call insns, any
3761 may_trap_p instruction may throw. */
3762 && GET_CODE (PATTERN (insn)) != CLOBBER
3763 && GET_CODE (PATTERN (insn)) != USE
3764 && insn_could_throw_p (insn))
3765 make_reg_eh_region_note (insn, 0, lp_nr);
3769 return last;
3772 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3773 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3774 generated a tail call (something that might be denied by the ABI
3775 rules governing the call; see calls.c).
3777 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3778 can still reach the rest of BB. The case here is __builtin_sqrt,
3779 where the NaN result goes through the external function (with a
3780 tailcall) and the normal result happens via a sqrt instruction.
   When no sibling call insn was emitted, *CAN_FALLTHRU is set to true
   and NULL is returned.  Otherwise the returned block is BB itself,
   or a new block created for the insns that remain after the sibcall
   barrier.  */
3782 static basic_block
3783 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3785 rtx_insn *last2, *last;
3786 edge e;
3787 edge_iterator ei;
3788 profile_probability probability;
/* LAST2 remembers the insn preceding everything emitted for STMT; it
   is only used for dumping.  */
3790 last2 = last = expand_gimple_stmt (stmt);
/* Scan the newly emitted insns for a sibling call.  */
3792 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3793 if (CALL_P (last) && SIBLING_CALL_P (last))
3794 goto found;
/* No sibling call was generated: this was expanded as a normal
   statement.  */
3796 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3798 *can_fallthru = true;
3799 return NULL;
3801 found:
3802 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3803 Any instructions emitted here are about to be deleted. */
3804 do_pending_stack_adjust ();
3806 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3807 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3808 EH or abnormal edges, we shouldn't have created a tail call in
3809 the first place. So it seems to me we should just be removing
3810 all edges here, or redirecting the existing fallthru edge to
3811 the exit block. */
/* PROBABILITY and COUNT accumulate the profile of the removed edges;
   they are given to the new sibcall edge created further down.  */
3813 probability = profile_probability::never ();
3814 profile_count count = profile_count::zero ();
/* The iterator is advanced only when the current edge is kept;
   after remove_edge the loop re-reads the edge at the same
   position.  */
3816 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3818 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3820 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
/* Take this edge's contribution out of the destination's profile,
   clamping the frequency at zero.  */
3822 e->dest->count -= e->count;
3823 e->dest->frequency -= EDGE_FREQUENCY (e);
3824 if (e->dest->frequency < 0)
3825 e->dest->frequency = 0;
3827 count += e->count;
3828 probability += e->probability;
3829 remove_edge (e);
3831 else
3832 ei_next (&ei);
3835 /* This is somewhat ugly: the call_expr expander often emits instructions
3836 after the sibcall (to perform the function return). These confuse the
3837 find_many_sub_basic_blocks code, so we need to get rid of these. */
/* The insn right after the sibcall is asserted to be a barrier.  */
3838 last = NEXT_INSN (last);
3839 gcc_assert (BARRIER_P (last));
/* Delete insns following the barrier until a label (or the end of
   the chain) is reached.  */
3841 *can_fallthru = false;
3842 while (NEXT_INSN (last))
3844 /* For instance an sqrt builtin expander expands if with
3845 sibcall in the then and label for `else`. */
3846 if (LABEL_P (NEXT_INSN (last)))
3848 *can_fallthru = true;
3849 break;
3851 delete_insn (NEXT_INSN (last));
/* Connect BB to the exit block with an abnormal sibcall edge that
   carries the profile gathered from the removed edges, and end BB at
   the barrier.  */
3854 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3855 | EDGE_SIBCALL);
3856 e->probability = probability;
3857 e->count = count;
3858 BB_END (bb) = last;
3859 update_bb_for_insn (bb);
/* Insns remain after the barrier (the loop above stopped at a label):
   put them in a new basic block placed after BB, and keep a trailing
   barrier out of that block.  */
3861 if (NEXT_INSN (last))
3863 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3865 last = BB_END (bb);
3866 if (BARRIER_P (last))
3867 BB_END (bb) = PREV_INSN (last);
3870 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3872 return bb;
3875 /* Return the difference between the floor and the truncated result of
3876 a signed division by OP1 with remainder MOD. */
3877 static rtx
3878 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3880 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3881 return gen_rtx_IF_THEN_ELSE
3882 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3883 gen_rtx_IF_THEN_ELSE
3884 (mode, gen_rtx_LT (BImode,
3885 gen_rtx_DIV (mode, op1, mod),
3886 const0_rtx),
3887 constm1_rtx, const0_rtx),
3888 const0_rtx);
3891 /* Return the difference between the ceil and the truncated result of
3892 a signed division by OP1 with remainder MOD. */
3893 static rtx
3894 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3896 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3897 return gen_rtx_IF_THEN_ELSE
3898 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3899 gen_rtx_IF_THEN_ELSE
3900 (mode, gen_rtx_GT (BImode,
3901 gen_rtx_DIV (mode, op1, mod),
3902 const0_rtx),
3903 const1_rtx, const0_rtx),
3904 const0_rtx);
3907 /* Return the difference between the ceil and the truncated result of
3908 an unsigned division by OP1 with remainder MOD. */
3909 static rtx
3910 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3912 /* (mod != 0 ? 1 : 0) */
3913 return gen_rtx_IF_THEN_ELSE
3914 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3915 const1_rtx, const0_rtx);
3918 /* Return the difference between the rounded and the truncated result
3919 of a signed division by OP1 with remainder MOD. Halfway cases are
3920 rounded away from zero, rather than to the nearest even number. */
3921 static rtx
3922 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3924 /* (abs (mod) >= abs (op1) - abs (mod)
3925 ? (op1 / mod > 0 ? 1 : -1)
3926 : 0) */
3927 return gen_rtx_IF_THEN_ELSE
3928 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3929 gen_rtx_MINUS (mode,
3930 gen_rtx_ABS (mode, op1),
3931 gen_rtx_ABS (mode, mod))),
3932 gen_rtx_IF_THEN_ELSE
3933 (mode, gen_rtx_GT (BImode,
3934 gen_rtx_DIV (mode, op1, mod),
3935 const0_rtx),
3936 const1_rtx, constm1_rtx),
3937 const0_rtx);
3940 /* Return the difference between the rounded and the truncated result
3941 of a unsigned division by OP1 with remainder MOD. Halfway cases
3942 are rounded away from zero, rather than to the nearest even
3943 number. */
3944 static rtx
3945 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
3947 /* (mod >= op1 - mod ? 1 : 0) */
3948 return gen_rtx_IF_THEN_ELSE
3949 (mode, gen_rtx_GE (BImode, mod,
3950 gen_rtx_MINUS (mode, op1, mod)),
3951 const1_rtx, const0_rtx);
3954 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3955 any rtl.
   AS is the address space the address belongs to.  Returns the
   converted rtx, X itself when no conversion is needed, or NULL when
   POINTERS_EXTEND_UNSIGNED is defined and the conversion cannot be
   expressed (see the end of the function).  */
3957 static rtx
3958 convert_debug_memory_address (machine_mode mode, rtx x,
3959 addr_space_t as)
3961 machine_mode xmode = GET_MODE (x);
/* Without POINTERS_EXTEND_UNSIGNED nothing is converted: the modes
   are only checked and X is returned unchanged at the bottom.  */
3963 #ifndef POINTERS_EXTEND_UNSIGNED
3964 gcc_assert (mode == Pmode
3965 || mode == targetm.addr_space.address_mode (as));
3966 gcc_assert (xmode == mode || xmode == VOIDmode);
3967 #else
3968 rtx temp;
3970 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
/* Already in the requested mode, or modeless: nothing to do.  */
3972 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3973 return x;
/* Narrowing takes the low part.  Widening uses ZERO_EXTEND when
   POINTERS_EXTEND_UNSIGNED is positive and SIGN_EXTEND when it is
   zero.  For a negative value neither applies, so the switch below
   tries to rebuild X directly in MODE.  */
3975 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3976 x = lowpart_subreg (mode, x, xmode);
3977 else if (POINTERS_EXTEND_UNSIGNED > 0)
3978 x = gen_rtx_ZERO_EXTEND (mode, x);
3979 else if (!POINTERS_EXTEND_UNSIGNED)
3980 x = gen_rtx_SIGN_EXTEND (mode, x);
3981 else
3983 switch (GET_CODE (x))
/* A SUBREG of something already in MODE can be stripped when it is a
   promoted variable, a pointer register, or a pointer register plus
   a constant.  */
3985 case SUBREG:
3986 if ((SUBREG_PROMOTED_VAR_P (x)
3987 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3988 || (GET_CODE (SUBREG_REG (x)) == PLUS
3989 && REG_P (XEXP (SUBREG_REG (x), 0))
3990 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
3991 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
3992 && GET_MODE (SUBREG_REG (x)) == mode)
3993 return SUBREG_REG (x);
3994 break;
/* Label and symbol references are re-created (or copied) in MODE.  */
3995 case LABEL_REF:
3996 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
3997 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
3998 return temp;
3999 case SYMBOL_REF:
4000 temp = shallow_copy_rtx (x);
4001 PUT_MODE (temp, mode);
4002 return temp;
/* CONST: convert the wrapped expression recursively; a NULL result
   is passed through to the caller.  */
4003 case CONST:
4004 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4005 if (temp)
4006 temp = gen_rtx_CONST (mode, temp);
4007 return temp;
/* PLUS/MINUS with a constant second operand: convert the first
   operand recursively and rebuild the operation in MODE.  */
4008 case PLUS:
4009 case MINUS:
4010 if (CONST_INT_P (XEXP (x, 1)))
4012 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4013 if (temp)
4014 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4016 break;
4017 default:
4018 break;
4020 /* Don't know how to express ptr_extend as operation in debug info. */
4021 return NULL;
4023 #endif /* POINTERS_EXTEND_UNSIGNED */
4025 return x;
4028 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4029 by avoid_deep_ter_for_debug.  The pointer is null until
   avoid_deep_ter_for_debug allocates the map when it first needs to
   record an entry.  */
4031 static hash_map<tree, tree> *deep_ter_debug_map;
4033 /* Split too deep TER chains for debug stmts using debug temporaries. */
4035 static void
4036 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4038 use_operand_p use_p;
4039 ssa_op_iter iter;
4040 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4042 tree use = USE_FROM_PTR (use_p);
4043 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4044 continue;
4045 gimple *g = get_gimple_for_ssa_name (use);
4046 if (g == NULL)
4047 continue;
4048 if (depth > 6 && !stmt_ends_bb_p (g))
4050 if (deep_ter_debug_map == NULL)
4051 deep_ter_debug_map = new hash_map<tree, tree>;
4053 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4054 if (vexpr != NULL)
4055 continue;
4056 vexpr = make_node (DEBUG_EXPR_DECL);
4057 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4058 DECL_ARTIFICIAL (vexpr) = 1;
4059 TREE_TYPE (vexpr) = TREE_TYPE (use);
4060 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4061 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4062 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4063 avoid_deep_ter_for_debug (def_temp, 0);
4065 else
4066 avoid_deep_ter_for_debug (g, depth + 1);
4070 /* Return an RTX equivalent to the value of the parameter DECL.
   The result is derived from DECL_INCOMING_RTL (DECL) only.  NULL_RTX
   is returned when the incoming RTL is missing, is BLKmode, or has
   neither of the two shapes handled below.  */
4072 static rtx
4073 expand_debug_parm_decl (tree decl)
4075 rtx incoming = DECL_INCOMING_RTL (decl);
/* First shape: the parameter arrives in a hard register, or in
   memory addressed by a hard register.  Its value is described as an
   ENTRY_VALUE of that location.  */
4077 if (incoming
4078 && GET_MODE (incoming) != BLKmode
4079 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4080 || (MEM_P (incoming)
4081 && REG_P (XEXP (incoming, 0))
4082 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4084 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4086 #ifdef HAVE_window_save
4087 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4088 If the target machine has an explicit window save instruction, the
4089 actual entry value is the corresponding OUTGOING_REGNO instead. */
4090 if (REG_P (incoming)
4091 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4092 incoming
4093 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4094 OUTGOING_REGNO (REGNO (incoming)), 0);
/* For a MEM, the same register renumbering is applied to the address
   register; when no renumbering is needed the MEM is copied.  */
4095 else if (MEM_P (incoming))
4097 rtx reg = XEXP (incoming, 0);
4098 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4100 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4101 incoming = replace_equiv_address_nv (incoming, reg);
4103 else
4104 incoming = copy_rtx (incoming);
4106 #endif
4108 ENTRY_VALUE_EXP (rtl) = incoming;
4109 return rtl;
/* Second shape: a non-addressable parameter that lives in memory at
   virtual_incoming_args_rtx, optionally plus a constant offset.  A
   copy of that MEM is returned.  */
4112 if (incoming
4113 && GET_MODE (incoming) != BLKmode
4114 && !TREE_ADDRESSABLE (decl)
4115 && MEM_P (incoming)
4116 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4117 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4118 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4119 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4120 return copy_rtx (incoming);
4122 return NULL_RTX;
4125 /* Return an RTX equivalent to the value of the tree expression EXP. */
4127 static rtx
4128 expand_debug_expr (tree exp)
4130 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4131 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4132 machine_mode inner_mode = VOIDmode;
4133 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4134 addr_space_t as;
4136 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4138 case tcc_expression:
4139 switch (TREE_CODE (exp))
4141 case COND_EXPR:
4142 case DOT_PROD_EXPR:
4143 case SAD_EXPR:
4144 case WIDEN_MULT_PLUS_EXPR:
4145 case WIDEN_MULT_MINUS_EXPR:
4146 case FMA_EXPR:
4147 goto ternary;
4149 case TRUTH_ANDIF_EXPR:
4150 case TRUTH_ORIF_EXPR:
4151 case TRUTH_AND_EXPR:
4152 case TRUTH_OR_EXPR:
4153 case TRUTH_XOR_EXPR:
4154 goto binary;
4156 case TRUTH_NOT_EXPR:
4157 goto unary;
4159 default:
4160 break;
4162 break;
4164 ternary:
4165 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4166 if (!op2)
4167 return NULL_RTX;
4168 /* Fall through. */
4170 binary:
4171 case tcc_binary:
4172 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4173 if (!op1)
4174 return NULL_RTX;
4175 switch (TREE_CODE (exp))
4177 case LSHIFT_EXPR:
4178 case RSHIFT_EXPR:
4179 case LROTATE_EXPR:
4180 case RROTATE_EXPR:
4181 case WIDEN_LSHIFT_EXPR:
4182 /* Ensure second operand isn't wider than the first one. */
4183 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4184 if (SCALAR_INT_MODE_P (inner_mode))
4186 machine_mode opmode = mode;
4187 if (VECTOR_MODE_P (mode))
4188 opmode = GET_MODE_INNER (mode);
4189 if (SCALAR_INT_MODE_P (opmode)
4190 && (GET_MODE_PRECISION (opmode)
4191 < GET_MODE_PRECISION (inner_mode)))
4192 op1 = lowpart_subreg (opmode, op1, inner_mode);
4194 break;
4195 default:
4196 break;
4198 /* Fall through. */
4200 unary:
4201 case tcc_unary:
4202 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4203 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4204 if (!op0)
4205 return NULL_RTX;
4206 break;
4208 case tcc_comparison:
4209 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4210 goto binary;
4212 case tcc_type:
4213 case tcc_statement:
4214 gcc_unreachable ();
4216 case tcc_constant:
4217 case tcc_exceptional:
4218 case tcc_declaration:
4219 case tcc_reference:
4220 case tcc_vl_exp:
4221 break;
4224 switch (TREE_CODE (exp))
4226 case STRING_CST:
4227 if (!lookup_constant_def (exp))
4229 if (strlen (TREE_STRING_POINTER (exp)) + 1
4230 != (size_t) TREE_STRING_LENGTH (exp))
4231 return NULL_RTX;
4232 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4233 op0 = gen_rtx_MEM (BLKmode, op0);
4234 set_mem_attributes (op0, exp, 0);
4235 return op0;
4237 /* Fall through. */
4239 case INTEGER_CST:
4240 case REAL_CST:
4241 case FIXED_CST:
4242 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4243 return op0;
4245 case COMPLEX_CST:
4246 gcc_assert (COMPLEX_MODE_P (mode));
4247 op0 = expand_debug_expr (TREE_REALPART (exp));
4248 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4249 return gen_rtx_CONCAT (mode, op0, op1);
4251 case DEBUG_EXPR_DECL:
4252 op0 = DECL_RTL_IF_SET (exp);
4254 if (op0)
4255 return op0;
4257 op0 = gen_rtx_DEBUG_EXPR (mode);
4258 DEBUG_EXPR_TREE_DECL (op0) = exp;
4259 SET_DECL_RTL (exp, op0);
4261 return op0;
4263 case VAR_DECL:
4264 case PARM_DECL:
4265 case FUNCTION_DECL:
4266 case LABEL_DECL:
4267 case CONST_DECL:
4268 case RESULT_DECL:
4269 op0 = DECL_RTL_IF_SET (exp);
4271 /* This decl was probably optimized away. */
4272 if (!op0)
4274 if (!VAR_P (exp)
4275 || DECL_EXTERNAL (exp)
4276 || !TREE_STATIC (exp)
4277 || !DECL_NAME (exp)
4278 || DECL_HARD_REGISTER (exp)
4279 || DECL_IN_CONSTANT_POOL (exp)
4280 || mode == VOIDmode)
4281 return NULL;
4283 op0 = make_decl_rtl_for_debug (exp);
4284 if (!MEM_P (op0)
4285 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4286 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4287 return NULL;
4289 else
4290 op0 = copy_rtx (op0);
4292 if (GET_MODE (op0) == BLKmode
4293 /* If op0 is not BLKmode, but mode is, adjust_mode
4294 below would ICE. While it is likely a FE bug,
4295 try to be robust here. See PR43166. */
4296 || mode == BLKmode
4297 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4299 gcc_assert (MEM_P (op0));
4300 op0 = adjust_address_nv (op0, mode, 0);
4301 return op0;
4304 /* Fall through. */
4306 adjust_mode:
4307 case PAREN_EXPR:
4308 CASE_CONVERT:
4310 inner_mode = GET_MODE (op0);
4312 if (mode == inner_mode)
4313 return op0;
4315 if (inner_mode == VOIDmode)
4317 if (TREE_CODE (exp) == SSA_NAME)
4318 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4319 else
4320 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4321 if (mode == inner_mode)
4322 return op0;
4325 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4327 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
4328 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4329 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
4330 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4331 else
4332 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4334 else if (FLOAT_MODE_P (mode))
4336 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4337 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4338 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4339 else
4340 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4342 else if (FLOAT_MODE_P (inner_mode))
4344 if (unsignedp)
4345 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4346 else
4347 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4349 else if (CONSTANT_P (op0)
4350 || GET_MODE_PRECISION (mode) <= GET_MODE_PRECISION (inner_mode))
4351 op0 = lowpart_subreg (mode, op0, inner_mode);
4352 else if (UNARY_CLASS_P (exp)
4353 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4354 : unsignedp)
4355 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4356 else
4357 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4359 return op0;
4362 case MEM_REF:
4363 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4365 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4366 TREE_OPERAND (exp, 0),
4367 TREE_OPERAND (exp, 1));
4368 if (newexp)
4369 return expand_debug_expr (newexp);
4371 /* FALLTHROUGH */
4372 case INDIRECT_REF:
4373 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4374 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4375 if (!op0)
4376 return NULL;
4378 if (TREE_CODE (exp) == MEM_REF)
4380 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4381 || (GET_CODE (op0) == PLUS
4382 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4383 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4384 Instead just use get_inner_reference. */
4385 goto component_ref;
4387 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4388 if (!op1 || !CONST_INT_P (op1))
4389 return NULL;
4391 op0 = plus_constant (inner_mode, op0, INTVAL (op1));
4394 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4396 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4397 op0, as);
4398 if (op0 == NULL_RTX)
4399 return NULL;
4401 op0 = gen_rtx_MEM (mode, op0);
4402 set_mem_attributes (op0, exp, 0);
4403 if (TREE_CODE (exp) == MEM_REF
4404 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4405 set_mem_expr (op0, NULL_TREE);
4406 set_mem_addr_space (op0, as);
4408 return op0;
4410 case TARGET_MEM_REF:
4411 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4412 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4413 return NULL;
4415 op0 = expand_debug_expr
4416 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4417 if (!op0)
4418 return NULL;
4420 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4421 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4422 op0, as);
4423 if (op0 == NULL_RTX)
4424 return NULL;
4426 op0 = gen_rtx_MEM (mode, op0);
4428 set_mem_attributes (op0, exp, 0);
4429 set_mem_addr_space (op0, as);
4431 return op0;
4433 component_ref:
4434 case ARRAY_REF:
4435 case ARRAY_RANGE_REF:
4436 case COMPONENT_REF:
4437 case BIT_FIELD_REF:
4438 case REALPART_EXPR:
4439 case IMAGPART_EXPR:
4440 case VIEW_CONVERT_EXPR:
4442 machine_mode mode1;
4443 HOST_WIDE_INT bitsize, bitpos;
4444 tree offset;
4445 int reversep, volatilep = 0;
4446 tree tem
4447 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4448 &unsignedp, &reversep, &volatilep);
4449 rtx orig_op0;
4451 if (bitsize == 0)
4452 return NULL;
4454 orig_op0 = op0 = expand_debug_expr (tem);
4456 if (!op0)
4457 return NULL;
4459 if (offset)
4461 machine_mode addrmode, offmode;
4463 if (!MEM_P (op0))
4464 return NULL;
4466 op0 = XEXP (op0, 0);
4467 addrmode = GET_MODE (op0);
4468 if (addrmode == VOIDmode)
4469 addrmode = Pmode;
4471 op1 = expand_debug_expr (offset);
4472 if (!op1)
4473 return NULL;
4475 offmode = GET_MODE (op1);
4476 if (offmode == VOIDmode)
4477 offmode = TYPE_MODE (TREE_TYPE (offset));
4479 if (addrmode != offmode)
4480 op1 = lowpart_subreg (addrmode, op1, offmode);
4482 /* Don't use offset_address here, we don't need a
4483 recognizable address, and we don't want to generate
4484 code. */
4485 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4486 op0, op1));
4489 if (MEM_P (op0))
4491 if (mode1 == VOIDmode)
4492 /* Bitfield. */
4493 mode1 = smallest_mode_for_size (bitsize, MODE_INT);
4494 if (bitpos >= BITS_PER_UNIT)
4496 op0 = adjust_address_nv (op0, mode1, bitpos / BITS_PER_UNIT);
4497 bitpos %= BITS_PER_UNIT;
4499 else if (bitpos < 0)
4501 HOST_WIDE_INT units
4502 = (-bitpos + BITS_PER_UNIT - 1) / BITS_PER_UNIT;
4503 op0 = adjust_address_nv (op0, mode1, -units);
4504 bitpos += units * BITS_PER_UNIT;
4506 else if (bitpos == 0 && bitsize == GET_MODE_BITSIZE (mode))
4507 op0 = adjust_address_nv (op0, mode, 0);
4508 else if (GET_MODE (op0) != mode1)
4509 op0 = adjust_address_nv (op0, mode1, 0);
4510 else
4511 op0 = copy_rtx (op0);
4512 if (op0 == orig_op0)
4513 op0 = shallow_copy_rtx (op0);
4514 set_mem_attributes (op0, exp, 0);
4517 if (bitpos == 0 && mode == GET_MODE (op0))
4518 return op0;
4520 if (bitpos < 0)
4521 return NULL;
4523 if (GET_MODE (op0) == BLKmode)
4524 return NULL;
4526 if ((bitpos % BITS_PER_UNIT) == 0
4527 && bitsize == GET_MODE_BITSIZE (mode1))
4529 machine_mode opmode = GET_MODE (op0);
4531 if (opmode == VOIDmode)
4532 opmode = TYPE_MODE (TREE_TYPE (tem));
4534 /* This condition may hold if we're expanding the address
4535 right past the end of an array that turned out not to
4536 be addressable (i.e., the address was only computed in
4537 debug stmts). The gen_subreg below would rightfully
4538 crash, and the address doesn't really exist, so just
4539 drop it. */
4540 if (bitpos >= GET_MODE_BITSIZE (opmode))
4541 return NULL;
4543 if ((bitpos % GET_MODE_BITSIZE (mode)) == 0)
4544 return simplify_gen_subreg (mode, op0, opmode,
4545 bitpos / BITS_PER_UNIT);
4548 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4549 && TYPE_UNSIGNED (TREE_TYPE (exp))
4550 ? SIGN_EXTRACT
4551 : ZERO_EXTRACT, mode,
4552 GET_MODE (op0) != VOIDmode
4553 ? GET_MODE (op0)
4554 : TYPE_MODE (TREE_TYPE (tem)),
4555 op0, GEN_INT (bitsize), GEN_INT (bitpos));
4558 case ABS_EXPR:
4559 return simplify_gen_unary (ABS, mode, op0, mode);
4561 case NEGATE_EXPR:
4562 return simplify_gen_unary (NEG, mode, op0, mode);
4564 case BIT_NOT_EXPR:
4565 return simplify_gen_unary (NOT, mode, op0, mode);
4567 case FLOAT_EXPR:
4568 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4569 0)))
4570 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4571 inner_mode);
4573 case FIX_TRUNC_EXPR:
4574 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4575 inner_mode);
4577 case POINTER_PLUS_EXPR:
4578 /* For the rare target where pointers are not the same size as
4579 size_t, we need to check for mis-matched modes and correct
4580 the addend. */
4581 if (op0 && op1
4582 && GET_MODE (op0) != VOIDmode && GET_MODE (op1) != VOIDmode
4583 && GET_MODE (op0) != GET_MODE (op1))
4585 if (GET_MODE_BITSIZE (GET_MODE (op0)) < GET_MODE_BITSIZE (GET_MODE (op1))
4586 /* If OP0 is a partial mode, then we must truncate, even if it has
4587 the same bitsize as OP1 as GCC's representation of partial modes
4588 is opaque. */
4589 || (GET_MODE_CLASS (GET_MODE (op0)) == MODE_PARTIAL_INT
4590 && GET_MODE_BITSIZE (GET_MODE (op0)) == GET_MODE_BITSIZE (GET_MODE (op1))))
4591 op1 = simplify_gen_unary (TRUNCATE, GET_MODE (op0), op1,
4592 GET_MODE (op1));
4593 else
4594 /* We always sign-extend, regardless of the signedness of
4595 the operand, because the operand is always unsigned
4596 here even if the original C expression is signed. */
4597 op1 = simplify_gen_unary (SIGN_EXTEND, GET_MODE (op0), op1,
4598 GET_MODE (op1));
4600 /* Fall through. */
4601 case PLUS_EXPR:
4602 return simplify_gen_binary (PLUS, mode, op0, op1);
4604 case MINUS_EXPR:
4605 return simplify_gen_binary (MINUS, mode, op0, op1);
4607 case MULT_EXPR:
4608 return simplify_gen_binary (MULT, mode, op0, op1);
4610 case RDIV_EXPR:
4611 case TRUNC_DIV_EXPR:
4612 case EXACT_DIV_EXPR:
4613 if (unsignedp)
4614 return simplify_gen_binary (UDIV, mode, op0, op1);
4615 else
4616 return simplify_gen_binary (DIV, mode, op0, op1);
4618 case TRUNC_MOD_EXPR:
4619 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4621 case FLOOR_DIV_EXPR:
4622 if (unsignedp)
4623 return simplify_gen_binary (UDIV, mode, op0, op1);
4624 else
4626 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4627 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4628 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4629 return simplify_gen_binary (PLUS, mode, div, adj);
4632 case FLOOR_MOD_EXPR:
4633 if (unsignedp)
4634 return simplify_gen_binary (UMOD, mode, op0, op1);
4635 else
4637 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4638 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4639 adj = simplify_gen_unary (NEG, mode,
4640 simplify_gen_binary (MULT, mode, adj, op1),
4641 mode);
4642 return simplify_gen_binary (PLUS, mode, mod, adj);
4645 case CEIL_DIV_EXPR:
4646 if (unsignedp)
4648 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4649 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4650 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4651 return simplify_gen_binary (PLUS, mode, div, adj);
4653 else
4655 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4656 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4657 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4658 return simplify_gen_binary (PLUS, mode, div, adj);
4661 case CEIL_MOD_EXPR:
4662 if (unsignedp)
4664 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4665 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4666 adj = simplify_gen_unary (NEG, mode,
4667 simplify_gen_binary (MULT, mode, adj, op1),
4668 mode);
4669 return simplify_gen_binary (PLUS, mode, mod, adj);
4671 else
4673 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4674 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4675 adj = simplify_gen_unary (NEG, mode,
4676 simplify_gen_binary (MULT, mode, adj, op1),
4677 mode);
4678 return simplify_gen_binary (PLUS, mode, mod, adj);
4681 case ROUND_DIV_EXPR:
4682 if (unsignedp)
4684 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4685 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4686 rtx adj = round_udiv_adjust (mode, mod, op1);
4687 return simplify_gen_binary (PLUS, mode, div, adj);
4689 else
4691 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4692 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4693 rtx adj = round_sdiv_adjust (mode, mod, op1);
4694 return simplify_gen_binary (PLUS, mode, div, adj);
4697 case ROUND_MOD_EXPR:
4698 if (unsignedp)
4700 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4701 rtx adj = round_udiv_adjust (mode, mod, op1);
4702 adj = simplify_gen_unary (NEG, mode,
4703 simplify_gen_binary (MULT, mode, adj, op1),
4704 mode);
4705 return simplify_gen_binary (PLUS, mode, mod, adj);
4707 else
4709 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4710 rtx adj = round_sdiv_adjust (mode, mod, op1);
4711 adj = simplify_gen_unary (NEG, mode,
4712 simplify_gen_binary (MULT, mode, adj, op1),
4713 mode);
4714 return simplify_gen_binary (PLUS, mode, mod, adj);
4717 case LSHIFT_EXPR:
4718 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4720 case RSHIFT_EXPR:
4721 if (unsignedp)
4722 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4723 else
4724 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4726 case LROTATE_EXPR:
4727 return simplify_gen_binary (ROTATE, mode, op0, op1);
4729 case RROTATE_EXPR:
4730 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4732 case MIN_EXPR:
4733 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4735 case MAX_EXPR:
4736 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4738 case BIT_AND_EXPR:
4739 case TRUTH_AND_EXPR:
4740 return simplify_gen_binary (AND, mode, op0, op1);
4742 case BIT_IOR_EXPR:
4743 case TRUTH_OR_EXPR:
4744 return simplify_gen_binary (IOR, mode, op0, op1);
4746 case BIT_XOR_EXPR:
4747 case TRUTH_XOR_EXPR:
4748 return simplify_gen_binary (XOR, mode, op0, op1);
4750 case TRUTH_ANDIF_EXPR:
4751 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4753 case TRUTH_ORIF_EXPR:
4754 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4756 case TRUTH_NOT_EXPR:
4757 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4759 case LT_EXPR:
4760 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4761 op0, op1);
4763 case LE_EXPR:
4764 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4765 op0, op1);
4767 case GT_EXPR:
4768 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4769 op0, op1);
4771 case GE_EXPR:
4772 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4773 op0, op1);
4775 case EQ_EXPR:
4776 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4778 case NE_EXPR:
4779 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4781 case UNORDERED_EXPR:
4782 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4784 case ORDERED_EXPR:
4785 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4787 case UNLT_EXPR:
4788 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4790 case UNLE_EXPR:
4791 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4793 case UNGT_EXPR:
4794 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4796 case UNGE_EXPR:
4797 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4799 case UNEQ_EXPR:
4800 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4802 case LTGT_EXPR:
4803 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4805 case COND_EXPR:
4806 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4808 case COMPLEX_EXPR:
4809 gcc_assert (COMPLEX_MODE_P (mode));
4810 if (GET_MODE (op0) == VOIDmode)
4811 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4812 if (GET_MODE (op1) == VOIDmode)
4813 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4814 return gen_rtx_CONCAT (mode, op0, op1);
4816 case CONJ_EXPR:
4817 if (GET_CODE (op0) == CONCAT)
4818 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4819 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4820 XEXP (op0, 1),
4821 GET_MODE_INNER (mode)));
4822 else
4824 machine_mode imode = GET_MODE_INNER (mode);
4825 rtx re, im;
4827 if (MEM_P (op0))
4829 re = adjust_address_nv (op0, imode, 0);
4830 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4832 else
4834 machine_mode ifmode = int_mode_for_mode (mode);
4835 machine_mode ihmode = int_mode_for_mode (imode);
4836 rtx halfsize;
4837 if (ifmode == BLKmode || ihmode == BLKmode)
4838 return NULL;
4839 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4840 re = op0;
4841 if (mode != ifmode)
4842 re = gen_rtx_SUBREG (ifmode, re, 0);
4843 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4844 if (imode != ihmode)
4845 re = gen_rtx_SUBREG (imode, re, 0);
4846 im = copy_rtx (op0);
4847 if (mode != ifmode)
4848 im = gen_rtx_SUBREG (ifmode, im, 0);
4849 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4850 if (imode != ihmode)
4851 im = gen_rtx_SUBREG (imode, im, 0);
4853 im = gen_rtx_NEG (imode, im);
4854 return gen_rtx_CONCAT (mode, re, im);
4857 case ADDR_EXPR:
4858 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4859 if (!op0 || !MEM_P (op0))
4861 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4862 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4863 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4864 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4865 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4866 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4868 if (handled_component_p (TREE_OPERAND (exp, 0)))
4870 HOST_WIDE_INT bitoffset, bitsize, maxsize;
4871 bool reverse;
4872 tree decl
4873 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
4874 &bitsize, &maxsize, &reverse);
4875 if ((VAR_P (decl)
4876 || TREE_CODE (decl) == PARM_DECL
4877 || TREE_CODE (decl) == RESULT_DECL)
4878 && (!TREE_ADDRESSABLE (decl)
4879 || target_for_debug_bind (decl))
4880 && (bitoffset % BITS_PER_UNIT) == 0
4881 && bitsize > 0
4882 && bitsize == maxsize)
4884 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4885 return plus_constant (mode, base, bitoffset / BITS_PER_UNIT);
4889 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4890 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4891 == ADDR_EXPR)
4893 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4894 0));
4895 if (op0 != NULL
4896 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4897 || (GET_CODE (op0) == PLUS
4898 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4899 && CONST_INT_P (XEXP (op0, 1)))))
4901 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4902 1));
4903 if (!op1 || !CONST_INT_P (op1))
4904 return NULL;
4906 return plus_constant (mode, op0, INTVAL (op1));
4910 return NULL;
4913 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4914 op0 = convert_debug_memory_address (mode, XEXP (op0, 0), as);
4916 return op0;
4918 case VECTOR_CST:
4920 unsigned i;
4922 op0 = gen_rtx_CONCATN
4923 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4925 for (i = 0; i < VECTOR_CST_NELTS (exp); ++i)
4927 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4928 if (!op1)
4929 return NULL;
4930 XVECEXP (op0, 0, i) = op1;
4933 return op0;
4936 case CONSTRUCTOR:
4937 if (TREE_CLOBBER_P (exp))
4938 return NULL;
4939 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4941 unsigned i;
4942 tree val;
4944 op0 = gen_rtx_CONCATN
4945 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4947 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4949 op1 = expand_debug_expr (val);
4950 if (!op1)
4951 return NULL;
4952 XVECEXP (op0, 0, i) = op1;
4955 if (i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)))
4957 op1 = expand_debug_expr
4958 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4960 if (!op1)
4961 return NULL;
4963 for (; i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)); i++)
4964 XVECEXP (op0, 0, i) = op1;
4967 return op0;
4969 else
4970 goto flag_unsupported;
4972 case CALL_EXPR:
4973 /* ??? Maybe handle some builtins? */
4974 return NULL;
4976 case SSA_NAME:
4978 gimple *g = get_gimple_for_ssa_name (exp);
4979 if (g)
4981 tree t = NULL_TREE;
4982 if (deep_ter_debug_map)
4984 tree *slot = deep_ter_debug_map->get (exp);
4985 if (slot)
4986 t = *slot;
4988 if (t == NULL_TREE)
4989 t = gimple_assign_rhs_to_tree (g);
4990 op0 = expand_debug_expr (t);
4991 if (!op0)
4992 return NULL;
4994 else
4996 /* If this is a reference to an incoming value of
4997 parameter that is never used in the code or where the
4998 incoming value is never used in the code, use
4999 PARM_DECL's DECL_RTL if set. */
5000 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5001 && SSA_NAME_VAR (exp)
5002 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5003 && has_zero_uses (exp))
5005 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5006 if (op0)
5007 goto adjust_mode;
5008 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5009 if (op0)
5010 goto adjust_mode;
5013 int part = var_to_partition (SA.map, exp);
5015 if (part == NO_PARTITION)
5016 return NULL;
5018 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5020 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5022 goto adjust_mode;
5025 case ERROR_MARK:
5026 return NULL;
5028 /* Vector stuff. For most of the codes we don't have rtl codes. */
5029 case REALIGN_LOAD_EXPR:
5030 case REDUC_MAX_EXPR:
5031 case REDUC_MIN_EXPR:
5032 case REDUC_PLUS_EXPR:
5033 case VEC_COND_EXPR:
5034 case VEC_PACK_FIX_TRUNC_EXPR:
5035 case VEC_PACK_SAT_EXPR:
5036 case VEC_PACK_TRUNC_EXPR:
5037 case VEC_UNPACK_FLOAT_HI_EXPR:
5038 case VEC_UNPACK_FLOAT_LO_EXPR:
5039 case VEC_UNPACK_HI_EXPR:
5040 case VEC_UNPACK_LO_EXPR:
5041 case VEC_WIDEN_MULT_HI_EXPR:
5042 case VEC_WIDEN_MULT_LO_EXPR:
5043 case VEC_WIDEN_MULT_EVEN_EXPR:
5044 case VEC_WIDEN_MULT_ODD_EXPR:
5045 case VEC_WIDEN_LSHIFT_HI_EXPR:
5046 case VEC_WIDEN_LSHIFT_LO_EXPR:
5047 case VEC_PERM_EXPR:
5048 return NULL;
5050 /* Misc codes. */
5051 case ADDR_SPACE_CONVERT_EXPR:
5052 case FIXED_CONVERT_EXPR:
5053 case OBJ_TYPE_REF:
5054 case WITH_SIZE_EXPR:
5055 case BIT_INSERT_EXPR:
5056 return NULL;
5058 case DOT_PROD_EXPR:
5059 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5060 && SCALAR_INT_MODE_P (mode))
5063 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5064 0)))
5065 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5066 inner_mode);
5068 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5069 1)))
5070 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5071 inner_mode);
5072 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5073 return simplify_gen_binary (PLUS, mode, op0, op2);
5075 return NULL;
5077 case WIDEN_MULT_EXPR:
5078 case WIDEN_MULT_PLUS_EXPR:
5079 case WIDEN_MULT_MINUS_EXPR:
5080 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5081 && SCALAR_INT_MODE_P (mode))
5083 inner_mode = GET_MODE (op0);
5084 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5085 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5086 else
5087 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5088 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5089 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5090 else
5091 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5092 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5093 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5094 return op0;
5095 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5096 return simplify_gen_binary (PLUS, mode, op0, op2);
5097 else
5098 return simplify_gen_binary (MINUS, mode, op2, op0);
5100 return NULL;
5102 case MULT_HIGHPART_EXPR:
5103 /* ??? Similar to the above. */
5104 return NULL;
5106 case WIDEN_SUM_EXPR:
5107 case WIDEN_LSHIFT_EXPR:
5108 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5109 && SCALAR_INT_MODE_P (mode))
5112 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5113 0)))
5114 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5115 inner_mode);
5116 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5117 ? ASHIFT : PLUS, mode, op0, op1);
5119 return NULL;
5121 case FMA_EXPR:
5122 return simplify_gen_ternary (FMA, mode, inner_mode, op0, op1, op2);
5124 default:
5125 flag_unsupported:
5126 if (flag_checking)
5128 debug_tree (exp);
5129 gcc_unreachable ();
5131 return NULL;
5135 /* Return an RTX equivalent to the source bind value of the tree expression
5136 EXP. */
5138 static rtx
5139 expand_debug_source_expr (tree exp)
5141 rtx op0 = NULL_RTX;
5142 machine_mode mode = VOIDmode, inner_mode;
5144 switch (TREE_CODE (exp))
5146 case PARM_DECL:
5148 mode = DECL_MODE (exp);
5149 op0 = expand_debug_parm_decl (exp);
5150 if (op0)
5151 break;
5152 /* See if this isn't an argument that has been completely
5153 optimized out. */
5154 if (!DECL_RTL_SET_P (exp)
5155 && !DECL_INCOMING_RTL (exp)
5156 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5158 tree aexp = DECL_ORIGIN (exp);
5159 if (DECL_CONTEXT (aexp)
5160 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5162 vec<tree, va_gc> **debug_args;
5163 unsigned int ix;
5164 tree ddecl;
5165 debug_args = decl_debug_args_lookup (current_function_decl);
5166 if (debug_args != NULL)
5168 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5169 ix += 2)
5170 if (ddecl == aexp)
5171 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5175 break;
5177 default:
5178 break;
5181 if (op0 == NULL_RTX)
5182 return NULL_RTX;
5184 inner_mode = GET_MODE (op0);
5185 if (mode == inner_mode)
5186 return op0;
5188 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5190 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
5191 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5192 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
5193 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5194 else
5195 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5197 else if (FLOAT_MODE_P (mode))
5198 gcc_unreachable ();
5199 else if (FLOAT_MODE_P (inner_mode))
5201 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5202 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5203 else
5204 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5206 else if (CONSTANT_P (op0)
5207 || GET_MODE_BITSIZE (mode) <= GET_MODE_BITSIZE (inner_mode))
5208 op0 = lowpart_subreg (mode, op0, inner_mode);
5209 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5210 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5211 else
5212 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5214 return op0;
5217 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5218 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5219 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5221 static void
5222 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5224 rtx exp = *exp_p;
5226 if (exp == NULL_RTX)
5227 return;
5229 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5230 return;
5232 if (depth == 4)
5234 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5235 rtx dval = make_debug_expr_from_rtl (exp);
5237 /* Emit a debug bind insn before INSN. */
5238 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5239 DEBUG_EXPR_TREE_DECL (dval), exp,
5240 VAR_INIT_STATUS_INITIALIZED);
5242 emit_debug_insn_before (bind, insn);
5243 *exp_p = dval;
5244 return;
5247 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5248 int i, j;
5249 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5250 switch (*format_ptr++)
5252 case 'e':
5253 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5254 break;
5256 case 'E':
5257 case 'V':
5258 for (j = 0; j < XVECLEN (exp, i); j++)
5259 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5260 break;
5262 default:
5263 break;
5267 /* Expand the _LOCs in debug insns. We run this after expanding all
5268 regular insns, so that any variables referenced in the function
5269 will have their DECL_RTLs set. */
5271 static void
5272 expand_debug_locations (void)
5274 rtx_insn *insn;
5275 rtx_insn *last = get_last_insn ();
5276 int save_strict_alias = flag_strict_aliasing;
5278 /* New alias sets while setting up memory attributes cause
5279 -fcompare-debug failures, even though it doesn't bring about any
5280 codegen changes. */
5281 flag_strict_aliasing = 0;
5283 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5284 if (DEBUG_INSN_P (insn))
5286 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5287 rtx val;
5288 rtx_insn *prev_insn, *insn2;
5289 machine_mode mode;
5291 if (value == NULL_TREE)
5292 val = NULL_RTX;
5293 else
5295 if (INSN_VAR_LOCATION_STATUS (insn)
5296 == VAR_INIT_STATUS_UNINITIALIZED)
5297 val = expand_debug_source_expr (value);
5298 /* The avoid_deep_ter_for_debug function inserts
5299 debug bind stmts after SSA_NAME definition, with the
5300 SSA_NAME as the whole bind location. Disable temporarily
5301 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5302 being defined in this DEBUG_INSN. */
5303 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5305 tree *slot = deep_ter_debug_map->get (value);
5306 if (slot)
5308 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5309 *slot = NULL_TREE;
5310 else
5311 slot = NULL;
5313 val = expand_debug_expr (value);
5314 if (slot)
5315 *slot = INSN_VAR_LOCATION_DECL (insn);
5317 else
5318 val = expand_debug_expr (value);
5319 gcc_assert (last == get_last_insn ());
5322 if (!val)
5323 val = gen_rtx_UNKNOWN_VAR_LOC ();
5324 else
5326 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5328 gcc_assert (mode == GET_MODE (val)
5329 || (GET_MODE (val) == VOIDmode
5330 && (CONST_SCALAR_INT_P (val)
5331 || GET_CODE (val) == CONST_FIXED
5332 || GET_CODE (val) == LABEL_REF)));
5335 INSN_VAR_LOCATION_LOC (insn) = val;
5336 prev_insn = PREV_INSN (insn);
5337 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5338 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5341 flag_strict_aliasing = save_strict_alias;
5344 /* Performs swapping operands of commutative operations to expand
5345 the expensive one first. */
5347 static void
5348 reorder_operands (basic_block bb)
5350 unsigned int *lattice; /* Hold cost of each statement. */
5351 unsigned int i = 0, n = 0;
5352 gimple_stmt_iterator gsi;
5353 gimple_seq stmts;
5354 gimple *stmt;
5355 bool swap;
5356 tree op0, op1;
5357 ssa_op_iter iter;
5358 use_operand_p use_p;
5359 gimple *def0, *def1;
5361 /* Compute cost of each statement using estimate_num_insns. */
5362 stmts = bb_seq (bb);
5363 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5365 stmt = gsi_stmt (gsi);
5366 if (!is_gimple_debug (stmt))
5367 gimple_set_uid (stmt, n++);
5369 lattice = XNEWVEC (unsigned int, n);
5370 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5372 unsigned cost;
5373 stmt = gsi_stmt (gsi);
5374 if (is_gimple_debug (stmt))
5375 continue;
5376 cost = estimate_num_insns (stmt, &eni_size_weights);
5377 lattice[i] = cost;
5378 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5380 tree use = USE_FROM_PTR (use_p);
5381 gimple *def_stmt;
5382 if (TREE_CODE (use) != SSA_NAME)
5383 continue;
5384 def_stmt = get_gimple_for_ssa_name (use);
5385 if (!def_stmt)
5386 continue;
5387 lattice[i] += lattice[gimple_uid (def_stmt)];
5389 i++;
5390 if (!is_gimple_assign (stmt)
5391 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5392 continue;
5393 op0 = gimple_op (stmt, 1);
5394 op1 = gimple_op (stmt, 2);
5395 if (TREE_CODE (op0) != SSA_NAME
5396 || TREE_CODE (op1) != SSA_NAME)
5397 continue;
5398 /* Swap operands if the second one is more expensive. */
5399 def0 = get_gimple_for_ssa_name (op0);
5400 def1 = get_gimple_for_ssa_name (op1);
5401 if (!def1)
5402 continue;
5403 swap = false;
5404 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5405 swap = true;
5406 if (swap)
5408 if (dump_file && (dump_flags & TDF_DETAILS))
5410 fprintf (dump_file, "Swap operands in stmt:\n");
5411 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5412 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5413 def0 ? lattice[gimple_uid (def0)] : 0,
5414 lattice[gimple_uid (def1)]);
5416 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5417 gimple_assign_rhs2_ptr (stmt));
5420 XDELETE (lattice);
5423 /* Expand basic block BB from GIMPLE trees to RTL. */
5425 static basic_block
5426 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5428 gimple_stmt_iterator gsi;
5429 gimple_seq stmts;
5430 gimple *stmt = NULL;
5431 rtx_note *note;
5432 rtx_insn *last;
5433 edge e;
5434 edge_iterator ei;
5436 if (dump_file)
5437 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5438 bb->index);
5440 /* Note that since we are now transitioning from GIMPLE to RTL, we
5441 cannot use the gsi_*_bb() routines because they expect the basic
5442 block to be in GIMPLE, instead of RTL. Therefore, we need to
5443 access the BB sequence directly. */
5444 if (optimize)
5445 reorder_operands (bb);
5446 stmts = bb_seq (bb);
5447 bb->il.gimple.seq = NULL;
5448 bb->il.gimple.phi_nodes = NULL;
5449 rtl_profile_for_bb (bb);
5450 init_rtl_bb_info (bb);
5451 bb->flags |= BB_RTL;
5453 /* Remove the RETURN_EXPR if we may fall through to the exit
5454 instead. */
5455 gsi = gsi_last (stmts);
5456 if (!gsi_end_p (gsi)
5457 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5459 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5461 gcc_assert (single_succ_p (bb));
5462 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5464 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5465 && !gimple_return_retval (ret_stmt))
5467 gsi_remove (&gsi, false);
5468 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5472 gsi = gsi_start (stmts);
5473 if (!gsi_end_p (gsi))
5475 stmt = gsi_stmt (gsi);
5476 if (gimple_code (stmt) != GIMPLE_LABEL)
5477 stmt = NULL;
5480 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5482 if (stmt || elt)
5484 last = get_last_insn ();
5486 if (stmt)
5488 expand_gimple_stmt (stmt);
5489 gsi_next (&gsi);
5492 if (elt)
5493 emit_label (*elt);
5495 /* Java emits line number notes in the top of labels.
5496 ??? Make this go away once line number notes are obsoleted. */
5497 BB_HEAD (bb) = NEXT_INSN (last);
5498 if (NOTE_P (BB_HEAD (bb)))
5499 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5500 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5502 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5504 else
5505 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5507 NOTE_BASIC_BLOCK (note) = bb;
5509 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5511 basic_block new_bb;
5513 stmt = gsi_stmt (gsi);
5515 /* If this statement is a non-debug one, and we generate debug
5516 insns, then this one might be the last real use of a TERed
5517 SSA_NAME, but where there are still some debug uses further
5518 down. Expanding the current SSA name in such further debug
5519 uses by their RHS might lead to wrong debug info, as coalescing
5520 might make the operands of such RHS be placed into the same
5521 pseudo as something else. Like so:
5522 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5523 use(a_1);
5524 a_2 = ...
5525 #DEBUG ... => a_1
5526 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5527 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5528 the write to a_2 would actually have clobbered the place which
5529 formerly held a_0.
5531 So, instead of that, we recognize the situation, and generate
5532 debug temporaries at the last real use of TERed SSA names:
5533 a_1 = a_0 + 1;
5534 #DEBUG #D1 => a_1
5535 use(a_1);
5536 a_2 = ...
5537 #DEBUG ... => #D1
5539 if (MAY_HAVE_DEBUG_INSNS
5540 && SA.values
5541 && !is_gimple_debug (stmt))
5543 ssa_op_iter iter;
5544 tree op;
5545 gimple *def;
5547 location_t sloc = curr_insn_location ();
5549 /* Look for SSA names that have their last use here (TERed
5550 names always have only one real use). */
5551 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5552 if ((def = get_gimple_for_ssa_name (op)))
5554 imm_use_iterator imm_iter;
5555 use_operand_p use_p;
5556 bool have_debug_uses = false;
5558 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5560 if (gimple_debug_bind_p (USE_STMT (use_p)))
5562 have_debug_uses = true;
5563 break;
5567 if (have_debug_uses)
5569 /* OP is a TERed SSA name, with DEF its defining
5570 statement, and where OP is used in further debug
5571 instructions. Generate a debug temporary, and
5572 replace all uses of OP in debug insns with that
5573 temporary. */
5574 gimple *debugstmt;
5575 tree value = gimple_assign_rhs_to_tree (def);
5576 tree vexpr = make_node (DEBUG_EXPR_DECL);
5577 rtx val;
5578 machine_mode mode;
5580 set_curr_insn_location (gimple_location (def));
5582 DECL_ARTIFICIAL (vexpr) = 1;
5583 TREE_TYPE (vexpr) = TREE_TYPE (value);
5584 if (DECL_P (value))
5585 mode = DECL_MODE (value);
5586 else
5587 mode = TYPE_MODE (TREE_TYPE (value));
5588 SET_DECL_MODE (vexpr, mode);
5590 val = gen_rtx_VAR_LOCATION
5591 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5593 emit_debug_insn (val);
5595 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5597 if (!gimple_debug_bind_p (debugstmt))
5598 continue;
5600 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5601 SET_USE (use_p, vexpr);
5603 update_stmt (debugstmt);
5607 set_curr_insn_location (sloc);
5610 currently_expanding_gimple_stmt = stmt;
5612 /* Expand this statement, then evaluate the resulting RTL and
5613 fixup the CFG accordingly. */
5614 if (gimple_code (stmt) == GIMPLE_COND)
5616 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5617 if (new_bb)
5618 return new_bb;
5620 else if (gimple_debug_bind_p (stmt))
5622 location_t sloc = curr_insn_location ();
5623 gimple_stmt_iterator nsi = gsi;
5625 for (;;)
5627 tree var = gimple_debug_bind_get_var (stmt);
5628 tree value;
5629 rtx val;
5630 machine_mode mode;
5632 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5633 && TREE_CODE (var) != LABEL_DECL
5634 && !target_for_debug_bind (var))
5635 goto delink_debug_stmt;
5637 if (gimple_debug_bind_has_value_p (stmt))
5638 value = gimple_debug_bind_get_value (stmt);
5639 else
5640 value = NULL_TREE;
5642 last = get_last_insn ();
5644 set_curr_insn_location (gimple_location (stmt));
5646 if (DECL_P (var))
5647 mode = DECL_MODE (var);
5648 else
5649 mode = TYPE_MODE (TREE_TYPE (var));
5651 val = gen_rtx_VAR_LOCATION
5652 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5654 emit_debug_insn (val);
5656 if (dump_file && (dump_flags & TDF_DETAILS))
5658 /* We can't dump the insn with a TREE where an RTX
5659 is expected. */
5660 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5661 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5662 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5665 delink_debug_stmt:
5666 /* In order not to generate too many debug temporaries,
5667 we delink all uses of debug statements we already expanded.
5668 Therefore debug statements between definition and real
5669 use of TERed SSA names will continue to use the SSA name,
5670 and not be replaced with debug temps. */
5671 delink_stmt_imm_use (stmt);
5673 gsi = nsi;
5674 gsi_next (&nsi);
5675 if (gsi_end_p (nsi))
5676 break;
5677 stmt = gsi_stmt (nsi);
5678 if (!gimple_debug_bind_p (stmt))
5679 break;
5682 set_curr_insn_location (sloc);
5684 else if (gimple_debug_source_bind_p (stmt))
5686 location_t sloc = curr_insn_location ();
5687 tree var = gimple_debug_source_bind_get_var (stmt);
5688 tree value = gimple_debug_source_bind_get_value (stmt);
5689 rtx val;
5690 machine_mode mode;
5692 last = get_last_insn ();
5694 set_curr_insn_location (gimple_location (stmt));
5696 mode = DECL_MODE (var);
5698 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5699 VAR_INIT_STATUS_UNINITIALIZED);
5701 emit_debug_insn (val);
5703 if (dump_file && (dump_flags & TDF_DETAILS))
5705 /* We can't dump the insn with a TREE where an RTX
5706 is expected. */
5707 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5708 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5709 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5712 set_curr_insn_location (sloc);
5714 else
5716 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5717 if (call_stmt
5718 && gimple_call_tail_p (call_stmt)
5719 && disable_tail_calls)
5720 gimple_call_set_tail (call_stmt, false);
5722 if (call_stmt && gimple_call_tail_p (call_stmt))
5724 bool can_fallthru;
5725 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5726 if (new_bb)
5728 if (can_fallthru)
5729 bb = new_bb;
5730 else
5731 return new_bb;
5734 else
5736 def_operand_p def_p;
5737 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5739 if (def_p != NULL)
5741 /* Ignore this stmt if it is in the list of
5742 replaceable expressions. */
5743 if (SA.values
5744 && bitmap_bit_p (SA.values,
5745 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5746 continue;
5748 last = expand_gimple_stmt (stmt);
5749 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5754 currently_expanding_gimple_stmt = NULL;
5756 /* Expand implicit goto and convert goto_locus. */
5757 FOR_EACH_EDGE (e, ei, bb->succs)
5759 if (e->goto_locus != UNKNOWN_LOCATION)
5760 set_curr_insn_location (e->goto_locus);
5761 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5763 emit_jump (label_rtx_for_bb (e->dest));
5764 e->flags &= ~EDGE_FALLTHRU;
5768 /* Expanded RTL can create a jump in the last instruction of block.
5769 This later might be assumed to be a jump to successor and break edge insertion.
5770 We need to insert dummy move to prevent this. PR41440. */
5771 if (single_succ_p (bb)
5772 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5773 && (last = get_last_insn ())
5774 && (JUMP_P (last)
5775 || (DEBUG_INSN_P (last)
5776 && JUMP_P (prev_nondebug_insn (last)))))
5778 rtx dummy = gen_reg_rtx (SImode);
5779 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5782 do_pending_stack_adjust ();
5784 /* Find the block tail. The last insn in the block is the insn
5785 before a barrier and/or table jump insn. */
5786 last = get_last_insn ();
5787 if (BARRIER_P (last))
5788 last = PREV_INSN (last);
5789 if (JUMP_TABLE_DATA_P (last))
5790 last = PREV_INSN (PREV_INSN (last));
5791 BB_END (bb) = last;
5793 update_bb_for_insn (bb);
5795 return bb;
5799 /* Create a basic block for initialization code. */
5801 static basic_block
5802 construct_init_block (void)
5804 basic_block init_block, first_block;
5805 edge e = NULL;
5806 int flags;
5808 /* Multiple entry points not supported yet. */
5809 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5810 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5811 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5812 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5813 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5815 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5817 /* When entry edge points to first basic block, we don't need jump,
5818 otherwise we have to jump into proper target. */
5819 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5821 tree label = gimple_block_label (e->dest);
5823 emit_jump (jump_target_rtx (label));
5824 flags = 0;
5826 else
5827 flags = EDGE_FALLTHRU;
5829 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5830 get_last_insn (),
5831 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5832 init_block->frequency = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
5833 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5834 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5835 if (e)
5837 first_block = e->dest;
5838 redirect_edge_succ (e, init_block);
5839 e = make_single_succ_edge (init_block, first_block, flags);
5841 else
5842 e = make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5843 EDGE_FALLTHRU);
5845 update_bb_for_insn (init_block);
5846 return init_block;
5849 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5850 found in the block tree. */
5852 static void
5853 set_block_levels (tree block, int level)
5855 while (block)
5857 BLOCK_NUMBER (block) = level;
5858 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5859 block = BLOCK_CHAIN (block);
5863 /* Create a block containing landing pads and similar stuff. */
5865 static void
5866 construct_exit_block (void)
5868 rtx_insn *head = get_last_insn ();
5869 rtx_insn *end;
5870 basic_block exit_block;
5871 edge e, e2;
5872 unsigned ix;
5873 edge_iterator ei;
5874 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5875 rtx_insn *orig_end = BB_END (prev_bb);
5877 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5879 /* Make sure the locus is set to the end of the function, so that
5880 epilogue line numbers and warnings are set properly. */
5881 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5882 input_location = cfun->function_end_locus;
5884 /* Generate rtl for function exit. */
5885 expand_function_end ();
5887 end = get_last_insn ();
5888 if (head == end)
5889 return;
5890 /* While emitting the function end we could move end of the last basic
5891 block. */
5892 BB_END (prev_bb) = orig_end;
5893 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5894 head = NEXT_INSN (head);
5895 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5896 bb frequency counting will be confused. Any instructions before that
5897 label are emitted for the case where PREV_BB falls through into the
5898 exit block, so append those instructions to prev_bb in that case. */
5899 if (NEXT_INSN (head) != return_label)
5901 while (NEXT_INSN (head) != return_label)
5903 if (!NOTE_P (NEXT_INSN (head)))
5904 BB_END (prev_bb) = NEXT_INSN (head);
5905 head = NEXT_INSN (head);
5908 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5909 exit_block->frequency = EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency;
5910 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5911 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5913 ix = 0;
5914 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5916 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5917 if (!(e->flags & EDGE_ABNORMAL))
5918 redirect_edge_succ (e, exit_block);
5919 else
5920 ix++;
5923 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5924 EDGE_FALLTHRU);
5925 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5926 if (e2 != e)
5928 e->count -= e2->count;
5929 exit_block->count -= e2->count;
5930 exit_block->frequency -= EDGE_FREQUENCY (e2);
5932 if (exit_block->frequency < 0)
5933 exit_block->frequency = 0;
5934 update_bb_for_insn (exit_block);
5937 /* Helper function for discover_nonconstant_array_refs.
5938 Look for ARRAY_REF nodes with non-constant indexes and mark them
5939 addressable. */
5941 static tree
5942 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5943 void *data ATTRIBUTE_UNUSED)
5945 tree t = *tp;
5947 if (IS_TYPE_OR_DECL_P (t))
5948 *walk_subtrees = 0;
5949 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5951 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5952 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5953 && (!TREE_OPERAND (t, 2)
5954 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5955 || (TREE_CODE (t) == COMPONENT_REF
5956 && (!TREE_OPERAND (t,2)
5957 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5958 || TREE_CODE (t) == BIT_FIELD_REF
5959 || TREE_CODE (t) == REALPART_EXPR
5960 || TREE_CODE (t) == IMAGPART_EXPR
5961 || TREE_CODE (t) == VIEW_CONVERT_EXPR
5962 || CONVERT_EXPR_P (t))
5963 t = TREE_OPERAND (t, 0);
5965 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5967 t = get_base_address (t);
5968 if (t && DECL_P (t)
5969 && DECL_MODE (t) != BLKmode)
5970 TREE_ADDRESSABLE (t) = 1;
5973 *walk_subtrees = 0;
5976 return NULL_TREE;
5979 /* RTL expansion is not able to compile array references with variable
5980 offsets for arrays stored in single register. Discover such
5981 expressions and mark variables as addressable to avoid this
5982 scenario. */
5984 static void
5985 discover_nonconstant_array_refs (void)
5987 basic_block bb;
5988 gimple_stmt_iterator gsi;
5990 FOR_EACH_BB_FN (bb, cfun)
5991 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5993 gimple *stmt = gsi_stmt (gsi);
5994 if (!is_gimple_debug (stmt))
5995 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
5999 /* This function sets crtl->args.internal_arg_pointer to a virtual
6000 register if DRAP is needed. Local register allocator will replace
6001 virtual_incoming_args_rtx with the virtual register. */
6003 static void
6004 expand_stack_alignment (void)
6006 rtx drap_rtx;
6007 unsigned int preferred_stack_boundary;
6009 if (! SUPPORTS_STACK_ALIGNMENT)
6010 return;
6012 if (cfun->calls_alloca
6013 || cfun->has_nonlocal_label
6014 || crtl->has_nonlocal_goto)
6015 crtl->need_drap = true;
6017 /* Call update_stack_boundary here again to update incoming stack
6018 boundary. It may set incoming stack alignment to a different
6019 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6020 use the minimum incoming stack alignment to check if it is OK
6021 to perform sibcall optimization since sibcall optimization will
6022 only align the outgoing stack to incoming stack boundary. */
6023 if (targetm.calls.update_stack_boundary)
6024 targetm.calls.update_stack_boundary ();
6026 /* The incoming stack frame has to be aligned at least at
6027 parm_stack_boundary. */
6028 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6030 /* Update crtl->stack_alignment_estimated and use it later to align
6031 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6032 exceptions since callgraph doesn't collect incoming stack alignment
6033 in this case. */
6034 if (cfun->can_throw_non_call_exceptions
6035 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6036 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6037 else
6038 preferred_stack_boundary = crtl->preferred_stack_boundary;
6039 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6040 crtl->stack_alignment_estimated = preferred_stack_boundary;
6041 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6042 crtl->stack_alignment_needed = preferred_stack_boundary;
6044 gcc_assert (crtl->stack_alignment_needed
6045 <= crtl->stack_alignment_estimated);
6047 crtl->stack_realign_needed
6048 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6049 crtl->stack_realign_tried = crtl->stack_realign_needed;
6051 crtl->stack_realign_processed = true;
6053 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6054 alignment. */
6055 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6056 drap_rtx = targetm.calls.get_drap_rtx ();
6058 /* stack_realign_drap and drap_rtx must match. */
6059 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6061 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6062 if (NULL != drap_rtx)
6064 crtl->args.internal_arg_pointer = drap_rtx;
6066 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6067 needed. */
6068 fixup_tail_calls ();
6073 static void
6074 expand_main_function (void)
6076 #if (defined(INVOKE__main) \
6077 || (!defined(HAS_INIT_SECTION) \
6078 && !defined(INIT_SECTION_ASM_OP) \
6079 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6080 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
6081 #endif
6085 /* Expand code to initialize the stack_protect_guard. This is invoked at
6086 the beginning of a function to be protected. */
6088 static void
6089 stack_protect_prologue (void)
6091 tree guard_decl = targetm.stack_protect_guard ();
6092 rtx x, y;
6094 x = expand_normal (crtl->stack_protect_guard);
6095 if (guard_decl)
6096 y = expand_normal (guard_decl);
6097 else
6098 y = const0_rtx;
6100 /* Allow the target to copy from Y to X without leaking Y into a
6101 register. */
6102 if (targetm.have_stack_protect_set ())
6103 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6105 emit_insn (insn);
6106 return;
6109 /* Otherwise do a straight move. */
6110 emit_move_insn (x, y);
6113 /* Translate the intermediate representation contained in the CFG
6114 from GIMPLE trees to RTL.
6116 We do conversion per basic block and preserve/update the tree CFG.
6117 This implies we have to do some magic as the CFG can simultaneously
6118 consist of basic blocks containing RTL and GIMPLE trees. This can
6119 confuse the CFG hooks, so be careful to not manipulate CFG during
6120 the expansion. */
6122 namespace {
6124 const pass_data pass_data_expand =
6126 RTL_PASS, /* type */
6127 "expand", /* name */
6128 OPTGROUP_NONE, /* optinfo_flags */
6129 TV_EXPAND, /* tv_id */
6130 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6131 | PROP_gimple_lcx
6132 | PROP_gimple_lvec
6133 | PROP_gimple_lva), /* properties_required */
6134 PROP_rtl, /* properties_provided */
6135 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6136 0, /* todo_flags_start */
6137 0, /* todo_flags_finish */
6140 class pass_expand : public rtl_opt_pass
6142 public:
6143 pass_expand (gcc::context *ctxt)
6144 : rtl_opt_pass (pass_data_expand, ctxt)
6147 /* opt_pass methods: */
6148 virtual unsigned int execute (function *);
6150 }; // class pass_expand
/* Execute the expand pass on FUN: take the function out of SSA form,
   expand its variables, parameters and every basic block to RTL, build
   the init and exit blocks, commit insns queued on edges, then clean up
   the CFG and the state used during expansion.  Always returns 0.  */
6152 unsigned int
6153 pass_expand::execute (function *fun)
6155 basic_block bb, init_block;
6156 edge_iterator ei;
6157 edge e;
6158 rtx_insn *var_seq, *var_ret_seq;
6159 unsigned i;
/* Going out of SSA is accounted to its own timevar.  */
6161 timevar_push (TV_OUT_OF_SSA);
6162 rewrite_out_of_ssa (&SA);
6163 timevar_pop (TV_OUT_OF_SSA);
6164 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6166 if (MAY_HAVE_DEBUG_STMTS && flag_tree_ter)
6168 gimple_stmt_iterator gsi;
6169 FOR_EACH_BB_FN (bb, cfun)
6170 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6171 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6172 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6175 /* Make sure all values used by the optimization passes have sane
6176 defaults. */
6177 reg_renumber = 0;
6179 /* Some backends want to know that we are expanding to RTL. */
6180 currently_expanding_to_rtl = 1;
6181 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6182 free_dominance_info (CDI_DOMINATORS);
6184 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6186 if (chkp_function_instrumented_p (current_function_decl))
6187 chkp_reset_rtl_bounds ();
6189 insn_locations_init ();
6190 if (!DECL_IS_BUILTIN (current_function_decl))
6192 /* Eventually, all FEs should explicitly set function_start_locus. */
6193 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6194 set_curr_insn_location
6195 (DECL_SOURCE_LOCATION (current_function_decl));
6196 else
6197 set_curr_insn_location (fun->function_start_locus);
6199 else
6200 set_curr_insn_location (UNKNOWN_LOCATION);
6201 prologue_location = curr_insn_location ();
6203 #ifdef INSN_SCHEDULING
6204 init_sched_attrs ();
6205 #endif
6207 /* Make sure first insn is a note even if we don't want linenums.
6208 This makes sure the first insn will never be deleted.
6209 Also, final expects a note to appear there. */
6210 emit_note (NOTE_INSN_DELETED);
6212 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6213 discover_nonconstant_array_refs ();
6215 targetm.expand_to_rtl_hook ();
6216 crtl->init_stack_alignment ();
6217 fun->cfg->max_jumptable_ents = 0;
6219 /* Resolve the function section. Some targets, like ARM EABI rely on knowledge
6220 of the function section at expansion time to predict distance of calls. */
6221 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6223 /* Expand the variables recorded during gimple lowering. */
6224 timevar_push (TV_VAR_EXPAND);
6225 start_sequence ();
6227 var_ret_seq = expand_used_vars ();
6229 var_seq = get_insns ();
6230 end_sequence ();
6231 timevar_pop (TV_VAR_EXPAND);
6233 /* Honor stack protection warnings. */
6234 if (warn_stack_protect)
6236 if (fun->calls_alloca)
6237 warning (OPT_Wstack_protector,
6238 "stack protector not protecting local variables: "
6239 "variable length buffer");
6240 if (has_short_buffer && !crtl->stack_protect_guard)
6241 warning (OPT_Wstack_protector,
6242 "stack protector not protecting function: "
6243 "all local arrays are less than %d bytes long",
6244 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6247 /* Set up parameters and prepare for return, for the function. */
6248 expand_function_start (current_function_decl);
6250 /* If we emitted any instructions for setting up the variables,
6251 emit them before the FUNCTION_START note. */
6252 if (var_seq)
6254 emit_insn_before (var_seq, parm_birth_insn);
6256 /* In expand_function_end we'll insert the alloca save/restore
6257 before parm_birth_insn. We've just inserted an alloca call.
6258 Adjust the pointer to match. */
6259 parm_birth_insn = var_seq;
6262 /* Now propagate the RTL assignment of each partition to the
6263 underlying var of each SSA_NAME. */
6264 tree name;
6266 FOR_EACH_SSA_NAME (i, name, cfun)
6268 /* We might have generated new SSA names in
6269 update_alias_info_with_stack_vars. They will have a NULL
6270 defining statements, and won't be part of the partitioning,
6271 so ignore those. */
6272 if (!SSA_NAME_DEF_STMT (name))
6273 continue;
6275 adjust_one_expanded_partition_var (name);
6278 /* Clean up RTL of variables that straddle across multiple
6279 partitions, and check that the rtl of any PARM_DECLs that are not
6280 cleaned up is that of their default defs. */
6281 FOR_EACH_SSA_NAME (i, name, cfun)
6283 int part;
6285 /* We might have generated new SSA names in
6286 update_alias_info_with_stack_vars. They will have a NULL
6287 defining statements, and won't be part of the partitioning,
6288 so ignore those. */
6289 if (!SSA_NAME_DEF_STMT (name))
6290 continue;
6291 part = var_to_partition (SA.map, name);
6292 if (part == NO_PARTITION)
6293 continue;
6295 /* If this decl was marked as living in multiple places, reset
6296 this now to NULL. */
6297 tree var = SSA_NAME_VAR (name);
6298 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6299 SET_DECL_RTL (var, NULL);
6300 /* Check that the pseudos chosen by assign_parms are those of
6301 the corresponding default defs. */
6302 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6303 && (TREE_CODE (var) == PARM_DECL
6304 || TREE_CODE (var) == RESULT_DECL))
6306 rtx in = DECL_RTL_IF_SET (var);
6307 gcc_assert (in);
6308 rtx out = SA.partition_to_pseudo[part];
6309 gcc_assert (in == out);
6311 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6312 those expected by debug backends for each parm and for
6313 the result. This is particularly important for stabs,
6314 whose register elimination from parm's DECL_RTL may cause
6315 -fcompare-debug differences as SET_DECL_RTL changes reg's
6316 attrs. So, make sure the RTL already has the parm as the
6317 EXPR, so that it won't change. */
6318 SET_DECL_RTL (var, NULL_RTX);
6319 if (MEM_P (in))
6320 set_mem_attributes (in, var, true);
6321 SET_DECL_RTL (var, in);
6325 /* If this function is `main', emit a call to `__main'
6326 to run global initializers, etc. */
6327 if (DECL_NAME (current_function_decl)
6328 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6329 && DECL_FILE_SCOPE_P (current_function_decl))
6330 expand_main_function ();
6332 /* Initialize the stack_protect_guard field. This must happen after the
6333 call to __main (if any) so that the external decl is initialized. */
6334 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6335 stack_protect_prologue ();
6337 expand_phi_nodes (&SA);
6339 /* Release any stale SSA redirection data. */
6340 redirect_edge_var_map_empty ();
6342 /* Register rtl specific functions for cfg. */
6343 rtl_register_cfg_hooks ();
6345 init_block = construct_init_block ();
6347 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6348 remaining edges later. */
6349 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6350 e->flags &= ~EDGE_EXECUTABLE;
/* Expand every block between the init block and the exit block.  The
   loop variable is reassigned to the block returned by
   expand_gimple_basic_block, and iteration continues from there.  */
6352 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6353 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6354 next_bb)
6355 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6357 if (MAY_HAVE_DEBUG_INSNS)
6358 expand_debug_locations ();
6360 if (deep_ter_debug_map)
6362 delete deep_ter_debug_map;
6363 deep_ter_debug_map = NULL;
6366 /* Free stuff we no longer need after GIMPLE optimizations. */
6367 free_dominance_info (CDI_DOMINATORS);
6368 free_dominance_info (CDI_POST_DOMINATORS);
6369 delete_tree_cfg_annotations (fun);
6371 timevar_push (TV_OUT_OF_SSA);
6372 finish_out_of_ssa (&SA);
6373 timevar_pop (TV_OUT_OF_SSA);
6375 timevar_push (TV_POST_EXPAND);
6376 /* We are no longer in SSA form. */
6377 fun->gimple_df->in_ssa_p = false;
6378 loops_state_clear (LOOP_CLOSED_SSA);
6380 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6381 conservatively to true until they are all profile aware. */
/* NOTE(review): the comment above does not describe the statements that
   follow it (they release lab_rtx_for_bb and the histograms); it looks
   stale -- confirm.  */
6382 delete lab_rtx_for_bb;
6383 free_histograms (fun);
6385 construct_exit_block ();
6386 insn_locations_finalize ();
/* Emit the sequence returned by expand_used_vars after the return label,
   or after the basic block note that directly follows it.  */
6388 if (var_ret_seq)
6390 rtx_insn *after = return_label;
6391 rtx_insn *next = NEXT_INSN (after);
6392 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6393 after = next;
6394 emit_insn_after (var_ret_seq, after);
6397 /* Zap the tree EH table. */
6398 set_eh_throw_stmt_table (fun, NULL);
6400 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6401 split edges which edge insertions might do. */
6402 rebuild_jump_labels (get_insns ());
/* Commit the insns queued on edges (e->insns.r).  The iterator is only
   advanced when the current edge has nothing queued.  */
6404 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6405 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6407 edge e;
6408 edge_iterator ei;
6409 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6411 if (e->insns.r)
6413 rebuild_jump_labels_chain (e->insns.r);
6414 /* Put insns after parm birth, but before
6415 NOTE_INSN_FUNCTION_BEG. */
6416 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6417 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6419 rtx_insn *insns = e->insns.r;
6420 e->insns.r = NULL;
6421 if (NOTE_P (parm_birth_insn)
6422 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6423 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6424 else
6425 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6427 else
6428 commit_one_edge_insertion (e);
6430 else
6431 ei_next (&ei);
6435 /* We're done expanding trees to RTL. */
6436 currently_expanding_to_rtl = 0;
6438 flush_mark_addressable_queue ();
6440 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6441 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6443 edge e;
6444 edge_iterator ei;
6445 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6447 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6448 e->flags &= ~EDGE_EXECUTABLE;
6450 /* At the moment not all abnormal edges match the RTL
6451 representation. It is safe to remove them here as
6452 find_many_sub_basic_blocks will rediscover them.
6453 In the future we should get this fixed properly. */
6454 if ((e->flags & EDGE_ABNORMAL)
6455 && !(e->flags & EDGE_SIBCALL))
6456 remove_edge (e);
6457 else
6458 ei_next (&ei);
/* Pass a bitmap with every block set to find_many_sub_basic_blocks.  */
6462 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6463 bitmap_ones (blocks);
6464 find_many_sub_basic_blocks (blocks);
6465 purge_all_dead_edges ();
6467 expand_stack_alignment ();
6469 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6470 function. */
6471 if (crtl->tail_call_emit)
6472 fixup_tail_calls ();
6474 /* After initial rtl generation, call back to finish generating
6475 exception support code. We need to do this before cleaning up
6476 the CFG as the code does not expect dead landing pads. */
6477 if (fun->eh->region_tree != NULL)
6478 finish_eh_generation ();
6480 /* Remove unreachable blocks, otherwise we cannot compute dominators
6481 which are needed for loop state verification. As a side-effect
6482 this also compacts blocks.
6483 ??? We cannot remove trivially dead insns here as for example
6484 the DRAP reg on i?86 is not magically live at this point.
6485 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6486 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6488 checking_verify_flow_info ();
6490 /* Initialize pseudos allocated for hard registers. */
6491 emit_initial_value_sets ();
6493 /* And finally unshare all RTL. */
6494 unshare_all_rtl ();
6496 /* There's no need to defer outputting this function any more; we
6497 know we want to output it. */
6498 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6500 /* Now that we're done expanding trees to RTL, we shouldn't have any
6501 more CONCATs anywhere. */
6502 generating_concat_p = 0;
6504 if (dump_file)
6506 fprintf (dump_file,
6507 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6508 /* And the pass manager will dump RTL for us. */
6511 /* If we're emitting a nested function, make sure its parent gets
6512 emitted as well. Doing otherwise confuses debug info. */
6514 tree parent;
6515 for (parent = DECL_CONTEXT (current_function_decl);
6516 parent != NULL_TREE;
6517 parent = get_containing_scope (parent))
6518 if (TREE_CODE (parent) == FUNCTION_DECL)
6519 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6522 /* We are now committed to emitting code for this function. Do any
6523 preparation, such as emitting abstract debug info for the inline
6524 before it gets mangled by optimization. */
6525 if (cgraph_function_possibly_inlined_p (current_function_decl))
6526 (*debug_hooks->outlining_inline_function) (current_function_decl);
6528 TREE_ASM_WRITTEN (current_function_decl) = 1;
6530 /* After expanding, the return labels are no longer needed. */
6531 return_label = NULL;
6532 naked_return_label = NULL;
6534 /* After expanding, the tm_restart map is no longer needed. */
6535 if (fun->gimple_df->tm_restart)
6536 fun->gimple_df->tm_restart = NULL;
6538 /* Tag the blocks with a depth number so that change_scope can find
6539 the common parent easily. */
6540 set_block_levels (DECL_INITIAL (fun->decl), 0);
6541 default_rtl_profile ();
6543 /* For -dx discard loops now, otherwise IL verify in clean_state will
6544 ICE. */
6545 if (rtl_dump_and_exit)
6547 cfun->curr_properties &= ~PROP_loops;
6548 loop_optimizer_finalize ();
6551 timevar_pop (TV_POST_EXPAND);
6553 return 0;
6556 } // anon namespace
6558 rtl_opt_pass *
6559 make_pass_expand (gcc::context *ctxt)
6561 return new pass_expand (ctxt);