Daily bump.
[official-gcc.git] / gcc / cfgexpand.c
blobc9d8118ed4526d9a307d5d3c25883b1c6cb60620
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2017 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "params.h"
65 #include "tree-inline.h"
66 #include "value-prof.h"
67 #include "tree-ssa-live.h"
68 #include "tree-outof-ssa.h"
69 #include "cfgloop.h"
70 #include "insn-attr.h" /* For INSN_SCHEDULING. */
71 #include "asan.h"
72 #include "tree-ssa-address.h"
73 #include "output.h"
74 #include "builtins.h"
75 #include "tree-chkp.h"
76 #include "rtl-chkp.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple *currently_expanding_gimple_stmt;
94 static rtx expand_debug_expr (tree);
96 static bool defer_stack_allocation (tree, bool);
98 static void record_alignment_for_reg_var (unsigned int);
100 /* Return an expression tree corresponding to the RHS of GIMPLE
101 statement STMT. */
103 tree
104 gimple_assign_rhs_to_tree (gimple *stmt)
106 tree t;
107 enum gimple_rhs_class grhs_class;
109 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
111 if (grhs_class == GIMPLE_TERNARY_RHS)
112 t = build3 (gimple_assign_rhs_code (stmt),
113 TREE_TYPE (gimple_assign_lhs (stmt)),
114 gimple_assign_rhs1 (stmt),
115 gimple_assign_rhs2 (stmt),
116 gimple_assign_rhs3 (stmt));
117 else if (grhs_class == GIMPLE_BINARY_RHS)
118 t = build2 (gimple_assign_rhs_code (stmt),
119 TREE_TYPE (gimple_assign_lhs (stmt)),
120 gimple_assign_rhs1 (stmt),
121 gimple_assign_rhs2 (stmt));
122 else if (grhs_class == GIMPLE_UNARY_RHS)
123 t = build1 (gimple_assign_rhs_code (stmt),
124 TREE_TYPE (gimple_assign_lhs (stmt)),
125 gimple_assign_rhs1 (stmt));
126 else if (grhs_class == GIMPLE_SINGLE_RHS)
128 t = gimple_assign_rhs1 (stmt);
129 /* Avoid modifying this tree in place below. */
130 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
131 && gimple_location (stmt) != EXPR_LOCATION (t))
132 || (gimple_block (stmt)
133 && currently_expanding_to_rtl
134 && EXPR_P (t)))
135 t = copy_node (t);
137 else
138 gcc_unreachable ();
140 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
141 SET_EXPR_LOCATION (t, gimple_location (stmt));
143 return t;
147 #ifndef STACK_ALIGNMENT_NEEDED
148 #define STACK_ALIGNMENT_NEEDED 1
149 #endif
151 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
153 /* Choose either CUR or NEXT as the leader DECL for a partition.
154 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
155 out of the same user variable being in multiple partitions (this is
156 less likely for compiler-introduced temps). */
158 static tree
159 leader_merge (tree cur, tree next)
161 if (cur == NULL || cur == next)
162 return next;
164 if (DECL_P (cur) && DECL_IGNORED_P (cur))
165 return cur;
167 if (DECL_P (next) && DECL_IGNORED_P (next))
168 return next;
170 return cur;
173 /* Associate declaration T with storage space X. If T is no
174 SSA name this is exactly SET_DECL_RTL, otherwise make the
175 partition of T associated with X. */
176 static inline void
177 set_rtl (tree t, rtx x)
179 gcc_checking_assert (!x
180 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
181 || (use_register_for_decl (t)
182 ? (REG_P (x)
183 || (GET_CODE (x) == CONCAT
184 && (REG_P (XEXP (x, 0))
185 || SUBREG_P (XEXP (x, 0)))
186 && (REG_P (XEXP (x, 1))
187 || SUBREG_P (XEXP (x, 1))))
188 /* We need to accept PARALLELs for RESUT_DECLs
189 because of vector types with BLKmode returned
190 in multiple registers, but they are supposed
191 to be uncoalesced. */
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && (GET_MODE (x) == BLKmode
196 || !flag_tree_coalesce_vars)))
197 : (MEM_P (x) || x == pc_rtx
198 || (GET_CODE (x) == CONCAT
199 && MEM_P (XEXP (x, 0))
200 && MEM_P (XEXP (x, 1))))));
201 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
202 RESULT_DECLs has the expected mode. For memory, we accept
203 unpromoted modes, since that's what we're likely to get. For
204 PARM_DECLs and RESULT_DECLs, we'll have been called by
205 set_parm_rtl, which will give us the default def, so we don't
206 have to compute it ourselves. For RESULT_DECLs, we accept mode
207 mismatches too, as long as we have BLKmode or are not coalescing
208 across variables, so that we don't reject BLKmode PARALLELs or
209 unpromoted REGs. */
210 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
211 || (SSAVAR (t)
212 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
213 && (promote_ssa_mode (t, NULL) == BLKmode
214 || !flag_tree_coalesce_vars))
215 || !use_register_for_decl (t)
216 || GET_MODE (x) == promote_ssa_mode (t, NULL));
218 if (x)
220 bool skip = false;
221 tree cur = NULL_TREE;
222 rtx xm = x;
224 retry:
225 if (MEM_P (xm))
226 cur = MEM_EXPR (xm);
227 else if (REG_P (xm))
228 cur = REG_EXPR (xm);
229 else if (SUBREG_P (xm))
231 gcc_assert (subreg_lowpart_p (xm));
232 xm = SUBREG_REG (xm);
233 goto retry;
235 else if (GET_CODE (xm) == CONCAT)
237 xm = XEXP (xm, 0);
238 goto retry;
240 else if (GET_CODE (xm) == PARALLEL)
242 xm = XVECEXP (xm, 0, 0);
243 gcc_assert (GET_CODE (xm) == EXPR_LIST);
244 xm = XEXP (xm, 0);
245 goto retry;
247 else if (xm == pc_rtx)
248 skip = true;
249 else
250 gcc_unreachable ();
252 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
254 if (cur != next)
256 if (MEM_P (x))
257 set_mem_attributes (x,
258 next && TREE_CODE (next) == SSA_NAME
259 ? TREE_TYPE (next)
260 : next, true);
261 else
262 set_reg_attrs_for_decl_rtl (next, x);
266 if (TREE_CODE (t) == SSA_NAME)
268 int part = var_to_partition (SA.map, t);
269 if (part != NO_PARTITION)
271 if (SA.partition_to_pseudo[part])
272 gcc_assert (SA.partition_to_pseudo[part] == x);
273 else if (x != pc_rtx)
274 SA.partition_to_pseudo[part] = x;
276 /* For the benefit of debug information at -O0 (where
277 vartracking doesn't run) record the place also in the base
278 DECL. For PARMs and RESULTs, do so only when setting the
279 default def. */
280 if (x && x != pc_rtx && SSA_NAME_VAR (t)
281 && (VAR_P (SSA_NAME_VAR (t))
282 || SSA_NAME_IS_DEFAULT_DEF (t)))
284 tree var = SSA_NAME_VAR (t);
285 /* If we don't yet have something recorded, just record it now. */
286 if (!DECL_RTL_SET_P (var))
287 SET_DECL_RTL (var, x);
288 /* If we have it set already to "multiple places" don't
289 change this. */
290 else if (DECL_RTL (var) == pc_rtx)
292 /* If we have something recorded and it's not the same place
293 as we want to record now, we have multiple partitions for the
294 same base variable, with different places. We can't just
295 randomly chose one, hence we have to say that we don't know.
296 This only happens with optimization, and there var-tracking
297 will figure out the right thing. */
298 else if (DECL_RTL (var) != x)
299 SET_DECL_RTL (var, pc_rtx);
302 else
303 SET_DECL_RTL (t, x);
306 /* This structure holds data relevant to one variable that will be
307 placed in a stack slot. */
308 struct stack_var
310 /* The Variable. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
314 if this variable becomes it's partition's representative. */
315 HOST_WIDE_INT size;
317 /* The *byte* alignment required for this variable. Or as, with the
318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* The partition representative. */
322 size_t representative;
324 /* The next stack variable in the partition, or EOC. */
325 size_t next;
327 /* The numbers of conflicting stack variables. */
328 bitmap conflicts;
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation. */
334 static struct stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices into stack_vars, ordered by stack_var_cmp: "large"
344 alignment entries first, then stack_vars[stack_vars_sorted[i]].size non-increasing. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
356 /* Used during expand_used_vars. Remember if we saw a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
360 /* Compute the byte alignment to use for DECL. Ignore alignment
361 we can't do with expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
369 align = TYPE_ALIGN (TREE_TYPE (decl));
370 else
372 align = LOCAL_DECL_ALIGNMENT (decl);
373 SET_DECL_ALIGN (decl, align);
375 return align / BITS_PER_UNIT;
378 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
379 down otherwise. Return truncated BASE value. */
381 static inline unsigned HOST_WIDE_INT
382 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
384 return align_up ? (base + align - 1) & -align : base & -align;
387 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
388 Return the frame offset. */
390 static HOST_WIDE_INT
391 alloc_stack_frame_space (HOST_WIDE_INT size, unsigned HOST_WIDE_INT align)
393 HOST_WIDE_INT offset, new_frame_offset;
395 if (FRAME_GROWS_DOWNWARD)
397 new_frame_offset
398 = align_base (frame_offset - frame_phase - size,
399 align, false) + frame_phase;
400 offset = new_frame_offset;
402 else
404 new_frame_offset
405 = align_base (frame_offset - frame_phase, align, true) + frame_phase;
406 offset = new_frame_offset;
407 new_frame_offset += size;
409 frame_offset = new_frame_offset;
411 if (frame_offset_overflow (frame_offset, cfun->decl))
412 frame_offset = offset = 0;
414 return offset;
417 /* Accumulate DECL into STACK_VARS. */
419 static void
420 add_stack_var (tree decl)
422 struct stack_var *v;
424 if (stack_vars_num >= stack_vars_alloc)
426 if (stack_vars_alloc)
427 stack_vars_alloc = stack_vars_alloc * 3 / 2;
428 else
429 stack_vars_alloc = 32;
430 stack_vars
431 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
433 if (!decl_to_stack_part)
434 decl_to_stack_part = new hash_map<tree, size_t>;
436 v = &stack_vars[stack_vars_num];
437 decl_to_stack_part->put (decl, stack_vars_num);
439 v->decl = decl;
440 tree size = TREE_CODE (decl) == SSA_NAME
441 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
442 : DECL_SIZE_UNIT (decl);
443 v->size = tree_to_uhwi (size);
444 /* Ensure that all variables have size, so that &a != &b for any two
445 variables that are simultaneously live. */
446 if (v->size == 0)
447 v->size = 1;
448 v->alignb = align_local_variable (decl);
449 /* An alignment of zero can mightily confuse us later. */
450 gcc_assert (v->alignb != 0);
452 /* All variables are initially in their own partition. */
453 v->representative = stack_vars_num;
454 v->next = EOC;
456 /* All variables initially conflict with no other. */
457 v->conflicts = NULL;
459 /* Ensure that this decl doesn't get put onto the list twice. */
460 set_rtl (decl, pc_rtx);
462 stack_vars_num++;
465 /* Make the decls associated with luid's X and Y conflict. */
467 static void
468 add_stack_var_conflict (size_t x, size_t y)
470 struct stack_var *a = &stack_vars[x];
471 struct stack_var *b = &stack_vars[y];
472 if (!a->conflicts)
473 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
474 if (!b->conflicts)
475 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
476 bitmap_set_bit (a->conflicts, y);
477 bitmap_set_bit (b->conflicts, x);
480 /* Check whether the decls associated with luid's X and Y conflict. */
482 static bool
483 stack_var_conflict_p (size_t x, size_t y)
485 struct stack_var *a = &stack_vars[x];
486 struct stack_var *b = &stack_vars[y];
487 if (x == y)
488 return false;
489 /* Partitions containing an SSA name result from gimple registers
490 with things like unsupported modes. They are top-level and
491 hence conflict with everything else. */
492 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
493 return true;
495 if (!a->conflicts || !b->conflicts)
496 return false;
497 return bitmap_bit_p (a->conflicts, y);
500 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
501 enter its partition number into bitmap DATA. */
503 static bool
504 visit_op (gimple *, tree op, tree, void *data)
506 bitmap active = (bitmap)data;
507 op = get_base_address (op);
508 if (op
509 && DECL_P (op)
510 && DECL_RTL_IF_SET (op) == pc_rtx)
512 size_t *v = decl_to_stack_part->get (op);
513 if (v)
514 bitmap_set_bit (active, *v);
516 return false;
519 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
520 record conflicts between it and all currently active other partitions
521 from bitmap DATA. */
523 static bool
524 visit_conflict (gimple *, tree op, tree, void *data)
526 bitmap active = (bitmap)data;
527 op = get_base_address (op);
528 if (op
529 && DECL_P (op)
530 && DECL_RTL_IF_SET (op) == pc_rtx)
532 size_t *v = decl_to_stack_part->get (op);
533 if (v && bitmap_set_bit (active, *v))
535 size_t num = *v;
536 bitmap_iterator bi;
537 unsigned i;
538 gcc_assert (num < stack_vars_num);
539 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
540 add_stack_var_conflict (num, i);
543 return false;
546 /* Helper routine for add_scope_conflicts, calculating the active partitions
547 at the end of BB, leaving the result in WORK. We're called to generate
548 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
549 liveness. */
551 static void
552 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
554 edge e;
555 edge_iterator ei;
556 gimple_stmt_iterator gsi;
557 walk_stmt_load_store_addr_fn visit;
559 bitmap_clear (work);
560 FOR_EACH_EDGE (e, ei, bb->preds)
561 bitmap_ior_into (work, (bitmap)e->src->aux);
563 visit = visit_op;
565 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
567 gimple *stmt = gsi_stmt (gsi);
568 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
570 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
572 gimple *stmt = gsi_stmt (gsi);
574 if (gimple_clobber_p (stmt))
576 tree lhs = gimple_assign_lhs (stmt);
577 size_t *v;
578 /* Nested function lowering might introduce LHSs
579 that are COMPONENT_REFs. */
580 if (!VAR_P (lhs))
581 continue;
582 if (DECL_RTL_IF_SET (lhs) == pc_rtx
583 && (v = decl_to_stack_part->get (lhs)))
584 bitmap_clear_bit (work, *v);
586 else if (!is_gimple_debug (stmt))
588 if (for_conflict
589 && visit == visit_op)
591 /* If this is the first real instruction in this BB we need
592 to add conflicts for everything live at this point now.
593 Unlike classical liveness for named objects we can't
594 rely on seeing a def/use of the names we're interested in.
595 There might merely be indirect loads/stores. We'd not add any
596 conflicts for such partitions. */
597 bitmap_iterator bi;
598 unsigned i;
599 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
601 struct stack_var *a = &stack_vars[i];
602 if (!a->conflicts)
603 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
604 bitmap_ior_into (a->conflicts, work);
606 visit = visit_conflict;
608 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
613 /* Generate stack partition conflicts between all partitions that are
614 simultaneously live. */
616 static void
617 add_scope_conflicts (void)
619 basic_block bb;
620 bool changed;
621 bitmap work = BITMAP_ALLOC (NULL);
622 int *rpo;
623 int n_bbs;
625 /* We approximate the live range of a stack variable by taking the first
626 mention of its name as starting point(s), and by the end-of-scope
627 death clobber added by gimplify as ending point(s) of the range.
628 This overapproximates in the case we for instance moved an address-taken
629 operation upward, without also moving a dereference to it upwards.
630 But it's conservatively correct as a variable never can hold values
631 before its name is mentioned at least once.
633 We then do a mostly classical bitmap liveness algorithm. */
635 FOR_ALL_BB_FN (bb, cfun)
636 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
638 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
639 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
641 changed = true;
642 while (changed)
644 int i;
645 changed = false;
646 for (i = 0; i < n_bbs; i++)
648 bitmap active;
649 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
650 active = (bitmap)bb->aux;
651 add_scope_conflicts_1 (bb, work, false);
652 if (bitmap_ior_into (active, work))
653 changed = true;
657 FOR_EACH_BB_FN (bb, cfun)
658 add_scope_conflicts_1 (bb, work, true);
660 free (rpo);
661 BITMAP_FREE (work);
662 FOR_ALL_BB_FN (bb, cfun)
663 BITMAP_FREE (bb->aux);
666 /* A subroutine of partition_stack_vars. A comparison function for qsort,
667 sorting an array of indices by the properties of the object. */
669 static int
670 stack_var_cmp (const void *a, const void *b)
672 size_t ia = *(const size_t *)a;
673 size_t ib = *(const size_t *)b;
674 unsigned int aligna = stack_vars[ia].alignb;
675 unsigned int alignb = stack_vars[ib].alignb;
676 HOST_WIDE_INT sizea = stack_vars[ia].size;
677 HOST_WIDE_INT sizeb = stack_vars[ib].size;
678 tree decla = stack_vars[ia].decl;
679 tree declb = stack_vars[ib].decl;
680 bool largea, largeb;
681 unsigned int uida, uidb;
683 /* Primary compare on "large" alignment. Large comes first. */
684 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
685 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
686 if (largea != largeb)
687 return (int)largeb - (int)largea;
689 /* Secondary compare on size, decreasing */
690 if (sizea > sizeb)
691 return -1;
692 if (sizea < sizeb)
693 return 1;
695 /* Tertiary compare on true alignment, decreasing. */
696 if (aligna < alignb)
697 return -1;
698 if (aligna > alignb)
699 return 1;
701 /* Final compare on ID for sort stability, increasing.
702 Two SSA names are compared by their version, SSA names come before
703 non-SSA names, and two normal decls are compared by their DECL_UID. */
704 if (TREE_CODE (decla) == SSA_NAME)
706 if (TREE_CODE (declb) == SSA_NAME)
707 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
708 else
709 return -1;
711 else if (TREE_CODE (declb) == SSA_NAME)
712 return 1;
713 else
714 uida = DECL_UID (decla), uidb = DECL_UID (declb);
715 if (uida < uidb)
716 return 1;
717 if (uida > uidb)
718 return -1;
719 return 0;
722 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
723 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
725 /* If the points-to solution *PI points to variables that are in a partition
726 together with other variables add all partition members to the pointed-to
727 variables bitmap. */
729 static void
730 add_partitioned_vars_to_ptset (struct pt_solution *pt,
731 part_hashmap *decls_to_partitions,
732 hash_set<bitmap> *visited, bitmap temp)
734 bitmap_iterator bi;
735 unsigned i;
736 bitmap *part;
738 if (pt->anything
739 || pt->vars == NULL
740 /* The pointed-to vars bitmap is shared, it is enough to
741 visit it once. */
742 || visited->add (pt->vars))
743 return;
745 bitmap_clear (temp);
747 /* By using a temporary bitmap to store all members of the partitions
748 we have to add we make sure to visit each of the partitions only
749 once. */
750 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
751 if ((!temp
752 || !bitmap_bit_p (temp, i))
753 && (part = decls_to_partitions->get (i)))
754 bitmap_ior_into (temp, *part);
755 if (!bitmap_empty_p (temp))
756 bitmap_ior_into (pt->vars, temp);
759 /* Update points-to sets based on partition info, so we can use them on RTL.
760 The bitmaps representing stack partitions will be saved until expand,
761 where partitioned decls used as bases in memory expressions will be
762 rewritten. */
764 static void
765 update_alias_info_with_stack_vars (void)
767 part_hashmap *decls_to_partitions = NULL;
768 size_t i, j;
769 tree var = NULL_TREE;
771 for (i = 0; i < stack_vars_num; i++)
773 bitmap part = NULL;
774 tree name;
775 struct ptr_info_def *pi;
777 /* Not interested in partitions with single variable. */
778 if (stack_vars[i].representative != i
779 || stack_vars[i].next == EOC)
780 continue;
782 if (!decls_to_partitions)
784 decls_to_partitions = new part_hashmap;
785 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
788 /* Create an SSA_NAME that points to the partition for use
789 as base during alias-oracle queries on RTL for bases that
790 have been partitioned. */
791 if (var == NULL_TREE)
792 var = create_tmp_var (ptr_type_node);
793 name = make_ssa_name (var);
795 /* Create bitmaps representing partitions. They will be used for
796 points-to sets later, so use GGC alloc. */
797 part = BITMAP_GGC_ALLOC ();
798 for (j = i; j != EOC; j = stack_vars[j].next)
800 tree decl = stack_vars[j].decl;
801 unsigned int uid = DECL_PT_UID (decl);
802 bitmap_set_bit (part, uid);
803 decls_to_partitions->put (uid, part);
804 cfun->gimple_df->decls_to_pointers->put (decl, name);
805 if (TREE_ADDRESSABLE (decl))
806 TREE_ADDRESSABLE (name) = 1;
809 /* Make the SSA name point to all partition members. */
810 pi = get_ptr_info (name);
811 pt_solution_set (&pi->pt, part, false);
814 /* Make all points-to sets that contain one member of a partition
815 contain all members of the partition. */
816 if (decls_to_partitions)
818 unsigned i;
819 tree name;
820 hash_set<bitmap> visited;
821 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
823 FOR_EACH_SSA_NAME (i, name, cfun)
825 struct ptr_info_def *pi;
827 if (POINTER_TYPE_P (TREE_TYPE (name))
828 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
829 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
830 &visited, temp);
833 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
834 decls_to_partitions, &visited, temp);
836 delete decls_to_partitions;
837 BITMAP_FREE (temp);
841 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
842 partitioning algorithm. Partitions A and B are known to be non-conflicting.
843 Merge them into a single partition A. */
845 static void
846 union_stack_vars (size_t a, size_t b)
848 struct stack_var *vb = &stack_vars[b];
849 bitmap_iterator bi;
850 unsigned u;
852 gcc_assert (stack_vars[b].next == EOC);
853 /* Add B to A's partition. */
854 stack_vars[b].next = stack_vars[a].next;
855 stack_vars[b].representative = a;
856 stack_vars[a].next = b;
858 /* Update the required alignment of partition A to account for B. */
859 if (stack_vars[a].alignb < stack_vars[b].alignb)
860 stack_vars[a].alignb = stack_vars[b].alignb;
862 /* Update the interference graph and merge the conflicts. */
863 if (vb->conflicts)
865 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
866 add_stack_var_conflict (a, stack_vars[u].representative);
867 BITMAP_FREE (vb->conflicts);
871 /* A subroutine of expand_used_vars. Binpack the variables into
872 partitions constrained by the interference graph. The overall
873 algorithm used is as follows:
875 Sort the objects by size in descending order.
876 For each object A {
877 S = size(A)
878 O = 0
879 loop {
880 Look for the largest non-conflicting object B with size <= S.
881 UNION (A, B)
886 static void
887 partition_stack_vars (void)
889 size_t si, sj, n = stack_vars_num;
891 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
892 for (si = 0; si < n; ++si)
893 stack_vars_sorted[si] = si;
895 if (n == 1)
896 return;
898 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
900 for (si = 0; si < n; ++si)
902 size_t i = stack_vars_sorted[si];
903 unsigned int ialign = stack_vars[i].alignb;
904 HOST_WIDE_INT isize = stack_vars[i].size;
906 /* Ignore objects that aren't partition representatives. If we
907 see a var that is not a partition representative, it must
908 have been merged earlier. */
909 if (stack_vars[i].representative != i)
910 continue;
912 for (sj = si + 1; sj < n; ++sj)
914 size_t j = stack_vars_sorted[sj];
915 unsigned int jalign = stack_vars[j].alignb;
916 HOST_WIDE_INT jsize = stack_vars[j].size;
918 /* Ignore objects that aren't partition representatives. */
919 if (stack_vars[j].representative != j)
920 continue;
922 /* Do not mix objects of "small" (supported) alignment
923 and "large" (unsupported) alignment. */
924 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
925 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
926 break;
928 /* For Address Sanitizer do not mix objects with different
929 sizes, as the shorter vars wouldn't be adequately protected.
930 Don't do that for "large" (unsupported) alignment objects,
931 those aren't protected anyway. */
932 if ((asan_sanitize_stack_p ())
933 && isize != jsize
934 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
935 break;
937 /* Ignore conflicting objects. */
938 if (stack_var_conflict_p (i, j))
939 continue;
941 /* UNION the objects, placing J at OFFSET. */
942 union_stack_vars (i, j);
946 update_alias_info_with_stack_vars ();
949 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
951 static void
952 dump_stack_var_partition (void)
954 size_t si, i, j, n = stack_vars_num;
956 for (si = 0; si < n; ++si)
958 i = stack_vars_sorted[si];
960 /* Skip variables that aren't partition representatives, for now. */
961 if (stack_vars[i].representative != i)
962 continue;
964 fprintf (dump_file, "Partition %lu: size " HOST_WIDE_INT_PRINT_DEC
965 " align %u\n", (unsigned long) i, stack_vars[i].size,
966 stack_vars[i].alignb);
968 for (j = i; j != EOC; j = stack_vars[j].next)
970 fputc ('\t', dump_file);
971 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
973 fputc ('\n', dump_file);
977 /* Assign rtl to DECL at BASE + OFFSET. */
979 static void
980 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
981 HOST_WIDE_INT offset)
983 unsigned align;
984 rtx x;
986 /* If this fails, we've overflowed the stack frame. Error nicely? */
987 gcc_assert (offset == trunc_int_for_mode (offset, Pmode));
989 x = plus_constant (Pmode, base, offset);
990 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
991 ? TYPE_MODE (TREE_TYPE (decl))
992 : DECL_MODE (SSAVAR (decl)), x);
994 if (TREE_CODE (decl) != SSA_NAME)
996 /* Set alignment we actually gave this decl if it isn't an SSA name.
997 If it is we generate stack slots only accidentally so it isn't as
998 important, we'll simply use the alignment that is already set. */
999 if (base == virtual_stack_vars_rtx)
1000 offset -= frame_phase;
1001 align = least_bit_hwi (offset);
1002 align *= BITS_PER_UNIT;
1003 if (align == 0 || align > base_align)
1004 align = base_align;
1006 /* One would think that we could assert that we're not decreasing
1007 alignment here, but (at least) the i386 port does exactly this
1008 via the MINIMUM_ALIGNMENT hook. */
1010 SET_DECL_ALIGN (decl, align);
1011 DECL_USER_ALIGN (decl) = 0;
1014 set_rtl (decl, x);
1017 struct stack_vars_data
1019 /* Vector of offset pairs, always end of some padding followed
1020 by start of the padding that needs Address Sanitizer protection.
1021 The vector is in reversed, highest offset pairs come first. */
1022 auto_vec<HOST_WIDE_INT> asan_vec;
1024 /* Vector of partition representative decls in between the paddings. */
1025 auto_vec<tree> asan_decl_vec;
1027 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1028 rtx asan_base;
1030 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1031 unsigned int asan_alignb;
1034 /* A subroutine of expand_used_vars. Give each partition representative
1035 a unique location within the stack frame. Update each partition member
1036 with that location. */
1038 static void
1039 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1041 size_t si, i, j, n = stack_vars_num;
1042 HOST_WIDE_INT large_size = 0, large_alloc = 0;
1043 rtx large_base = NULL;
1044 unsigned large_align = 0;
1045 bool large_allocation_done = false;
1046 tree decl;
1048 /* Determine if there are any variables requiring "large" alignment.
1049 Since these are dynamically allocated, we only process these if
1050 no predicate involved. */
1051 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1052 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1054 /* Find the total size of these variables. */
1055 for (si = 0; si < n; ++si)
1057 unsigned alignb;
1059 i = stack_vars_sorted[si];
1060 alignb = stack_vars[i].alignb;
1062 /* All "large" alignment decls come before all "small" alignment
1063 decls, but "large" alignment decls are not sorted based on
1064 their alignment. Increase large_align to track the largest
1065 required alignment. */
1066 if ((alignb * BITS_PER_UNIT) > large_align)
1067 large_align = alignb * BITS_PER_UNIT;
1069 /* Stop when we get to the first decl with "small" alignment. */
1070 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1071 break;
1073 /* Skip variables that aren't partition representatives. */
1074 if (stack_vars[i].representative != i)
1075 continue;
1077 /* Skip variables that have already had rtl assigned. See also
1078 add_stack_var where we perpetrate this pc_rtx hack. */
1079 decl = stack_vars[i].decl;
1080 if (TREE_CODE (decl) == SSA_NAME
1081 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1082 : DECL_RTL (decl) != pc_rtx)
1083 continue;
1085 large_size += alignb - 1;
1086 large_size &= -(HOST_WIDE_INT)alignb;
1087 large_size += stack_vars[i].size;
1091 for (si = 0; si < n; ++si)
1093 rtx base;
1094 unsigned base_align, alignb;
1095 HOST_WIDE_INT offset;
1097 i = stack_vars_sorted[si];
1099 /* Skip variables that aren't partition representatives, for now. */
1100 if (stack_vars[i].representative != i)
1101 continue;
1103 /* Skip variables that have already had rtl assigned. See also
1104 add_stack_var where we perpetrate this pc_rtx hack. */
1105 decl = stack_vars[i].decl;
1106 if (TREE_CODE (decl) == SSA_NAME
1107 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1108 : DECL_RTL (decl) != pc_rtx)
1109 continue;
1111 /* Check the predicate to see whether this variable should be
1112 allocated in this pass. */
1113 if (pred && !pred (i))
1114 continue;
1116 alignb = stack_vars[i].alignb;
1117 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1119 base = virtual_stack_vars_rtx;
1120 if ((asan_sanitize_stack_p ())
1121 && pred)
1123 HOST_WIDE_INT prev_offset
1124 = align_base (frame_offset,
1125 MAX (alignb, ASAN_RED_ZONE_SIZE),
1126 !FRAME_GROWS_DOWNWARD);
1127 tree repr_decl = NULL_TREE;
1128 offset
1129 = alloc_stack_frame_space (stack_vars[i].size
1130 + ASAN_RED_ZONE_SIZE,
1131 MAX (alignb, ASAN_RED_ZONE_SIZE));
1133 data->asan_vec.safe_push (prev_offset);
1134 data->asan_vec.safe_push (offset + stack_vars[i].size);
1135 /* Find best representative of the partition.
1136 Prefer those with DECL_NAME, even better
1137 satisfying asan_protect_stack_decl predicate. */
1138 for (j = i; j != EOC; j = stack_vars[j].next)
1139 if (asan_protect_stack_decl (stack_vars[j].decl)
1140 && DECL_NAME (stack_vars[j].decl))
1142 repr_decl = stack_vars[j].decl;
1143 break;
1145 else if (repr_decl == NULL_TREE
1146 && DECL_P (stack_vars[j].decl)
1147 && DECL_NAME (stack_vars[j].decl))
1148 repr_decl = stack_vars[j].decl;
1149 if (repr_decl == NULL_TREE)
1150 repr_decl = stack_vars[i].decl;
1151 data->asan_decl_vec.safe_push (repr_decl);
1152 data->asan_alignb = MAX (data->asan_alignb, alignb);
1153 if (data->asan_base == NULL)
1154 data->asan_base = gen_reg_rtx (Pmode);
1155 base = data->asan_base;
1157 if (!STRICT_ALIGNMENT)
1158 base_align = crtl->max_used_stack_slot_alignment;
1159 else
1160 base_align = MAX (crtl->max_used_stack_slot_alignment,
1161 GET_MODE_ALIGNMENT (SImode)
1162 << ASAN_SHADOW_SHIFT);
1164 else
1166 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1167 base_align = crtl->max_used_stack_slot_alignment;
1170 else
1172 /* Large alignment is only processed in the last pass. */
1173 if (pred)
1174 continue;
1176 /* If there were any variables requiring "large" alignment, allocate
1177 space. */
1178 if (large_size > 0 && ! large_allocation_done)
1180 HOST_WIDE_INT loffset;
1181 rtx large_allocsize;
1183 large_allocsize = GEN_INT (large_size);
1184 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1185 loffset = alloc_stack_frame_space
1186 (INTVAL (large_allocsize),
1187 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1188 large_base = get_dynamic_stack_base (loffset, large_align);
1189 large_allocation_done = true;
1191 gcc_assert (large_base != NULL);
1193 large_alloc += alignb - 1;
1194 large_alloc &= -(HOST_WIDE_INT)alignb;
1195 offset = large_alloc;
1196 large_alloc += stack_vars[i].size;
1198 base = large_base;
1199 base_align = large_align;
1202 /* Create rtl for each variable based on their location within the
1203 partition. */
1204 for (j = i; j != EOC; j = stack_vars[j].next)
1206 expand_one_stack_var_at (stack_vars[j].decl,
1207 base, base_align,
1208 offset);
1212 gcc_assert (large_alloc == large_size);
1215 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1216 static HOST_WIDE_INT
1217 account_stack_vars (void)
1219 size_t si, j, i, n = stack_vars_num;
1220 HOST_WIDE_INT size = 0;
1222 for (si = 0; si < n; ++si)
1224 i = stack_vars_sorted[si];
1226 /* Skip variables that aren't partition representatives, for now. */
1227 if (stack_vars[i].representative != i)
1228 continue;
1230 size += stack_vars[i].size;
1231 for (j = i; j != EOC; j = stack_vars[j].next)
1232 set_rtl (stack_vars[j].decl, NULL);
1234 return size;
1237 /* Record the RTL assignment X for the default def of PARM. */
1239 extern void
1240 set_parm_rtl (tree parm, rtx x)
1242 gcc_assert (TREE_CODE (parm) == PARM_DECL
1243 || TREE_CODE (parm) == RESULT_DECL);
1245 if (x && !MEM_P (x))
1247 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1248 TYPE_MODE (TREE_TYPE (parm)),
1249 TYPE_ALIGN (TREE_TYPE (parm)));
1251 /* If the variable alignment is very large we'll dynamicaly
1252 allocate it, which means that in-frame portion is just a
1253 pointer. ??? We've got a pseudo for sure here, do we
1254 actually dynamically allocate its spilling area if needed?
1255 ??? Isn't it a problem when POINTER_SIZE also exceeds
1256 MAX_SUPPORTED_STACK_ALIGNMENT, as on cris and lm32? */
1257 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1258 align = POINTER_SIZE;
1260 record_alignment_for_reg_var (align);
1263 tree ssa = ssa_default_def (cfun, parm);
1264 if (!ssa)
1265 return set_rtl (parm, x);
1267 int part = var_to_partition (SA.map, ssa);
1268 gcc_assert (part != NO_PARTITION);
1270 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1271 gcc_assert (changed);
1273 set_rtl (ssa, x);
1274 gcc_assert (DECL_RTL (parm) == x);
1277 /* A subroutine of expand_one_var. Called to immediately assign rtl
1278 to a variable to be allocated in the stack frame. */
1280 static void
1281 expand_one_stack_var_1 (tree var)
1283 HOST_WIDE_INT size, offset;
1284 unsigned byte_align;
1286 if (TREE_CODE (var) == SSA_NAME)
1288 tree type = TREE_TYPE (var);
1289 size = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1290 byte_align = TYPE_ALIGN_UNIT (type);
1292 else
1294 size = tree_to_uhwi (DECL_SIZE_UNIT (var));
1295 byte_align = align_local_variable (var);
1298 /* We handle highly aligned variables in expand_stack_vars. */
1299 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1301 offset = alloc_stack_frame_space (size, byte_align);
1303 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1304 crtl->max_used_stack_slot_alignment, offset);
1307 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1308 already assigned some MEM. */
1310 static void
1311 expand_one_stack_var (tree var)
1313 if (TREE_CODE (var) == SSA_NAME)
1315 int part = var_to_partition (SA.map, var);
1316 if (part != NO_PARTITION)
1318 rtx x = SA.partition_to_pseudo[part];
1319 gcc_assert (x);
1320 gcc_assert (MEM_P (x));
1321 return;
1325 return expand_one_stack_var_1 (var);
1328 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1329 that will reside in a hard register. */
1331 static void
1332 expand_one_hard_reg_var (tree var)
1334 rest_of_decl_compilation (var, 0, 0);
1337 /* Record the alignment requirements of some variable assigned to a
1338 pseudo. */
1340 static void
1341 record_alignment_for_reg_var (unsigned int align)
1343 if (SUPPORTS_STACK_ALIGNMENT
1344 && crtl->stack_alignment_estimated < align)
1346 /* stack_alignment_estimated shouldn't change after stack
1347 realign decision made */
1348 gcc_assert (!crtl->stack_realign_processed);
1349 crtl->stack_alignment_estimated = align;
1352 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1353 So here we only make sure stack_alignment_needed >= align. */
1354 if (crtl->stack_alignment_needed < align)
1355 crtl->stack_alignment_needed = align;
1356 if (crtl->max_used_stack_slot_alignment < align)
1357 crtl->max_used_stack_slot_alignment = align;
1360 /* Create RTL for an SSA partition. */
1362 static void
1363 expand_one_ssa_partition (tree var)
1365 int part = var_to_partition (SA.map, var);
1366 gcc_assert (part != NO_PARTITION);
1368 if (SA.partition_to_pseudo[part])
1369 return;
1371 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1372 TYPE_MODE (TREE_TYPE (var)),
1373 TYPE_ALIGN (TREE_TYPE (var)));
1375 /* If the variable alignment is very large we'll dynamicaly allocate
1376 it, which means that in-frame portion is just a pointer. */
1377 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1378 align = POINTER_SIZE;
1380 record_alignment_for_reg_var (align);
1382 if (!use_register_for_decl (var))
1384 if (defer_stack_allocation (var, true))
1385 add_stack_var (var);
1386 else
1387 expand_one_stack_var_1 (var);
1388 return;
1391 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1393 rtx x = gen_reg_rtx (reg_mode);
1395 set_rtl (var, x);
1398 /* Record the association between the RTL generated for partition PART
1399 and the underlying variable of the SSA_NAME VAR. */
1401 static void
1402 adjust_one_expanded_partition_var (tree var)
1404 if (!var)
1405 return;
1407 tree decl = SSA_NAME_VAR (var);
1409 int part = var_to_partition (SA.map, var);
1410 if (part == NO_PARTITION)
1411 return;
1413 rtx x = SA.partition_to_pseudo[part];
1415 gcc_assert (x);
1417 set_rtl (var, x);
1419 if (!REG_P (x))
1420 return;
1422 /* Note if the object is a user variable. */
1423 if (decl && !DECL_ARTIFICIAL (decl))
1424 mark_user_reg (x);
1426 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1427 mark_reg_pointer (x, get_pointer_alignment (var));
1430 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1431 that will reside in a pseudo register. */
1433 static void
1434 expand_one_register_var (tree var)
1436 if (TREE_CODE (var) == SSA_NAME)
1438 int part = var_to_partition (SA.map, var);
1439 if (part != NO_PARTITION)
1441 rtx x = SA.partition_to_pseudo[part];
1442 gcc_assert (x);
1443 gcc_assert (REG_P (x));
1444 return;
1446 gcc_unreachable ();
1449 tree decl = var;
1450 tree type = TREE_TYPE (decl);
1451 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1452 rtx x = gen_reg_rtx (reg_mode);
1454 set_rtl (var, x);
1456 /* Note if the object is a user variable. */
1457 if (!DECL_ARTIFICIAL (decl))
1458 mark_user_reg (x);
1460 if (POINTER_TYPE_P (type))
1461 mark_reg_pointer (x, get_pointer_alignment (var));
1464 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1465 has some associated error, e.g. its type is error-mark. We just need
1466 to pick something that won't crash the rest of the compiler. */
1468 static void
1469 expand_one_error_var (tree var)
1471 machine_mode mode = DECL_MODE (var);
1472 rtx x;
1474 if (mode == BLKmode)
1475 x = gen_rtx_MEM (BLKmode, const0_rtx);
1476 else if (mode == VOIDmode)
1477 x = const0_rtx;
1478 else
1479 x = gen_reg_rtx (mode);
1481 SET_DECL_RTL (var, x);
1484 /* A subroutine of expand_one_var. VAR is a variable that will be
1485 allocated to the local stack frame. Return true if we wish to
1486 add VAR to STACK_VARS so that it will be coalesced with other
1487 variables. Return false to allocate VAR immediately.
1489 This function is used to reduce the number of variables considered
1490 for coalescing, which reduces the size of the quadratic problem. */
1492 static bool
1493 defer_stack_allocation (tree var, bool toplevel)
1495 tree size_unit = TREE_CODE (var) == SSA_NAME
1496 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1497 : DECL_SIZE_UNIT (var);
1499 /* Whether the variable is small enough for immediate allocation not to be
1500 a problem with regard to the frame size. */
1501 bool smallish
1502 = ((HOST_WIDE_INT) tree_to_uhwi (size_unit)
1503 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING));
1505 /* If stack protection is enabled, *all* stack variables must be deferred,
1506 so that we can re-order the strings to the top of the frame.
1507 Similarly for Address Sanitizer. */
1508 if (flag_stack_protect || asan_sanitize_stack_p ())
1509 return true;
1511 unsigned int align = TREE_CODE (var) == SSA_NAME
1512 ? TYPE_ALIGN (TREE_TYPE (var))
1513 : DECL_ALIGN (var);
1515 /* We handle "large" alignment via dynamic allocation. We want to handle
1516 this extra complication in only one place, so defer them. */
1517 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1518 return true;
1520 bool ignored = TREE_CODE (var) == SSA_NAME
1521 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1522 : DECL_IGNORED_P (var);
1524 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1525 might be detached from their block and appear at toplevel when we reach
1526 here. We want to coalesce them with variables from other blocks when
1527 the immediate contribution to the frame size would be noticeable. */
1528 if (toplevel && optimize > 0 && ignored && !smallish)
1529 return true;
1531 /* Variables declared in the outermost scope automatically conflict
1532 with every other variable. The only reason to want to defer them
1533 at all is that, after sorting, we can more efficiently pack
1534 small variables in the stack frame. Continue to defer at -O2. */
1535 if (toplevel && optimize < 2)
1536 return false;
1538 /* Without optimization, *most* variables are allocated from the
1539 stack, which makes the quadratic problem large exactly when we
1540 want compilation to proceed as quickly as possible. On the
1541 other hand, we don't want the function's stack frame size to
1542 get completely out of hand. So we avoid adding scalars and
1543 "small" aggregates to the list at all. */
1544 if (optimize == 0 && smallish)
1545 return false;
1547 return true;
1550 /* A subroutine of expand_used_vars. Expand one variable according to
1551 its flavor. Variables to be placed on the stack are not actually
1552 expanded yet, merely recorded.
1553 When REALLY_EXPAND is false, only add stack values to be allocated.
1554 Return stack usage this variable is supposed to take.
1557 static HOST_WIDE_INT
1558 expand_one_var (tree var, bool toplevel, bool really_expand)
1560 unsigned int align = BITS_PER_UNIT;
1561 tree origvar = var;
1563 var = SSAVAR (var);
1565 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1567 if (is_global_var (var))
1568 return 0;
1570 /* Because we don't know if VAR will be in register or on stack,
1571 we conservatively assume it will be on stack even if VAR is
1572 eventually put into register after RA pass. For non-automatic
1573 variables, which won't be on stack, we collect alignment of
1574 type and ignore user specified alignment. Similarly for
1575 SSA_NAMEs for which use_register_for_decl returns true. */
1576 if (TREE_STATIC (var)
1577 || DECL_EXTERNAL (var)
1578 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1579 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1580 TYPE_MODE (TREE_TYPE (var)),
1581 TYPE_ALIGN (TREE_TYPE (var)));
1582 else if (DECL_HAS_VALUE_EXPR_P (var)
1583 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1584 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1585 or variables which were assigned a stack slot already by
1586 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1587 changed from the offset chosen to it. */
1588 align = crtl->stack_alignment_estimated;
1589 else
1590 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1592 /* If the variable alignment is very large we'll dynamicaly allocate
1593 it, which means that in-frame portion is just a pointer. */
1594 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1595 align = POINTER_SIZE;
1598 record_alignment_for_reg_var (align);
1600 if (TREE_CODE (origvar) == SSA_NAME)
1602 gcc_assert (!VAR_P (var)
1603 || (!DECL_EXTERNAL (var)
1604 && !DECL_HAS_VALUE_EXPR_P (var)
1605 && !TREE_STATIC (var)
1606 && TREE_TYPE (var) != error_mark_node
1607 && !DECL_HARD_REGISTER (var)
1608 && really_expand));
1610 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1612 else if (DECL_EXTERNAL (var))
1614 else if (DECL_HAS_VALUE_EXPR_P (var))
1616 else if (TREE_STATIC (var))
1618 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1620 else if (TREE_TYPE (var) == error_mark_node)
1622 if (really_expand)
1623 expand_one_error_var (var);
1625 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1627 if (really_expand)
1629 expand_one_hard_reg_var (var);
1630 if (!DECL_HARD_REGISTER (var))
1631 /* Invalid register specification. */
1632 expand_one_error_var (var);
1635 else if (use_register_for_decl (var))
1637 if (really_expand)
1638 expand_one_register_var (origvar);
1640 else if (! valid_constant_size_p (DECL_SIZE_UNIT (var)))
1642 /* Reject variables which cover more than half of the address-space. */
1643 if (really_expand)
1645 error ("size of variable %q+D is too large", var);
1646 expand_one_error_var (var);
1649 else if (defer_stack_allocation (var, toplevel))
1650 add_stack_var (origvar);
1651 else
1653 if (really_expand)
1655 if (lookup_attribute ("naked",
1656 DECL_ATTRIBUTES (current_function_decl)))
1657 error ("cannot allocate stack for variable %q+D, naked function.",
1658 var);
1660 expand_one_stack_var (origvar);
1664 return tree_to_uhwi (DECL_SIZE_UNIT (var));
1666 return 0;
1669 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1670 expanding variables. Those variables that can be put into registers
1671 are allocated pseudos; those that can't are put on the stack.
1673 TOPLEVEL is true if this is the outermost BLOCK. */
1675 static void
1676 expand_used_vars_for_block (tree block, bool toplevel)
1678 tree t;
1680 /* Expand all variables at this level. */
1681 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1682 if (TREE_USED (t)
1683 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1684 || !DECL_NONSHAREABLE (t)))
1685 expand_one_var (t, toplevel, true);
1687 /* Expand all variables at containing levels. */
1688 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1689 expand_used_vars_for_block (t, false);
1692 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1693 and clear TREE_USED on all local variables. */
1695 static void
1696 clear_tree_used (tree block)
1698 tree t;
1700 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1701 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1702 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1703 || !DECL_NONSHAREABLE (t))
1704 TREE_USED (t) = 0;
1706 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1707 clear_tree_used (t);
/* Values that flag_stack_protect is compared against in this file.  */
enum {
  /* Guard created when the function calls alloca, has protected decls,
     or carries the "stack_protect" attribute.  */
  SPCT_FLAG_DEFAULT = 1,
  /* Guard always created.  */
  SPCT_FLAG_ALL = 2,
  /* As the default, and additionally when the function has array-like or
     addressable locals or calls that use a return slot.  */
  SPCT_FLAG_STRONG = 3,
  /* Guard created only with the "stack_protect" attribute.  */
  SPCT_FLAG_EXPLICIT = 4
};
1717 /* Examine TYPE and determine a bit mask of the following features. */
1719 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1720 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1721 #define SPCT_HAS_ARRAY 4
1722 #define SPCT_HAS_AGGREGATE 8
1724 static unsigned int
1725 stack_protect_classify_type (tree type)
1727 unsigned int ret = 0;
1728 tree t;
1730 switch (TREE_CODE (type))
1732 case ARRAY_TYPE:
1733 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1734 if (t == char_type_node
1735 || t == signed_char_type_node
1736 || t == unsigned_char_type_node)
1738 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1739 unsigned HOST_WIDE_INT len;
1741 if (!TYPE_SIZE_UNIT (type)
1742 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1743 len = max;
1744 else
1745 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1747 if (len < max)
1748 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1749 else
1750 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1752 else
1753 ret = SPCT_HAS_ARRAY;
1754 break;
1756 case UNION_TYPE:
1757 case QUAL_UNION_TYPE:
1758 case RECORD_TYPE:
1759 ret = SPCT_HAS_AGGREGATE;
1760 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1761 if (TREE_CODE (t) == FIELD_DECL)
1762 ret |= stack_protect_classify_type (TREE_TYPE (t));
1763 break;
1765 default:
1766 break;
1769 return ret;
1772 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1773 part of the local stack frame. Remember if we ever return nonzero for
1774 any variable in this function. The return value is the phase number in
1775 which the variable should be allocated. */
1777 static int
1778 stack_protect_decl_phase (tree decl)
1780 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1781 int ret = 0;
1783 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1784 has_short_buffer = true;
1786 if (flag_stack_protect == SPCT_FLAG_ALL
1787 || flag_stack_protect == SPCT_FLAG_STRONG
1788 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1789 && lookup_attribute ("stack_protect",
1790 DECL_ATTRIBUTES (current_function_decl))))
1792 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1793 && !(bits & SPCT_HAS_AGGREGATE))
1794 ret = 1;
1795 else if (bits & SPCT_HAS_ARRAY)
1796 ret = 2;
1798 else
1799 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1801 if (ret)
1802 has_protected_decls = true;
1804 return ret;
1807 /* Two helper routines that check for phase 1 and phase 2. These are used
1808 as callbacks for expand_stack_vars. */
1810 static bool
1811 stack_protect_decl_phase_1 (size_t i)
1813 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1816 static bool
1817 stack_protect_decl_phase_2 (size_t i)
1819 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1822 /* And helper function that checks for asan phase (with stack protector
1823 it is phase 3). This is used as callback for expand_stack_vars.
1824 Returns true if any of the vars in the partition need to be protected. */
1826 static bool
1827 asan_decl_phase_3 (size_t i)
1829 while (i != EOC)
1831 if (asan_protect_stack_decl (stack_vars[i].decl))
1832 return true;
1833 i = stack_vars[i].next;
1835 return false;
1838 /* Ensure that variables in different stack protection phases conflict
1839 so that they are not merged and share the same stack slot. */
1841 static void
1842 add_stack_protection_conflicts (void)
1844 size_t i, j, n = stack_vars_num;
1845 unsigned char *phase;
1847 phase = XNEWVEC (unsigned char, n);
1848 for (i = 0; i < n; ++i)
1849 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1851 for (i = 0; i < n; ++i)
1853 unsigned char ph_i = phase[i];
1854 for (j = i + 1; j < n; ++j)
1855 if (ph_i != phase[j])
1856 add_stack_var_conflict (i, j);
1859 XDELETEVEC (phase);
1862 /* Create a decl for the guard at the top of the stack frame. */
1864 static void
1865 create_stack_guard (void)
1867 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1868 VAR_DECL, NULL, ptr_type_node);
1869 TREE_THIS_VOLATILE (guard) = 1;
1870 TREE_USED (guard) = 1;
1871 expand_one_stack_var (guard);
1872 crtl->stack_protect_guard = guard;
1875 /* Prepare for expanding variables. */
1876 static void
1877 init_vars_expansion (void)
1879 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1880 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1882 /* A map from decl to stack partition. */
1883 decl_to_stack_part = new hash_map<tree, size_t>;
1885 /* Initialize local stack smashing state. */
1886 has_protected_decls = false;
1887 has_short_buffer = false;
1890 /* Free up stack variable graph data. */
1891 static void
1892 fini_vars_expansion (void)
1894 bitmap_obstack_release (&stack_var_bitmap_obstack);
1895 if (stack_vars)
1896 XDELETEVEC (stack_vars);
1897 if (stack_vars_sorted)
1898 XDELETEVEC (stack_vars_sorted);
1899 stack_vars = NULL;
1900 stack_vars_sorted = NULL;
1901 stack_vars_alloc = stack_vars_num = 0;
1902 delete decl_to_stack_part;
1903 decl_to_stack_part = NULL;
1906 /* Make a fair guess for the size of the stack frame of the function
1907 in NODE. This doesn't have to be exact, the result is only used in
1908 the inline heuristics. So we don't want to run the full stack var
1909 packing algorithm (which is quadratic in the number of stack vars).
1910 Instead, we calculate the total size of all stack vars. This turns
1911 out to be a pretty fair estimate -- packing of stack vars doesn't
1912 happen very often. */
1914 HOST_WIDE_INT
1915 estimated_stack_frame_size (struct cgraph_node *node)
1917 HOST_WIDE_INT size = 0;
1918 size_t i;
1919 tree var;
1920 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1922 push_cfun (fn);
1924 init_vars_expansion ();
1926 FOR_EACH_LOCAL_DECL (fn, i, var)
1927 if (auto_var_in_fn_p (var, fn->decl))
1928 size += expand_one_var (var, true, false);
1930 if (stack_vars_num > 0)
1932 /* Fake sorting the stack vars for account_stack_vars (). */
1933 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1934 for (i = 0; i < stack_vars_num; ++i)
1935 stack_vars_sorted[i] = i;
1936 size += account_stack_vars ();
1939 fini_vars_expansion ();
1940 pop_cfun ();
1941 return size;
1944 /* Helper routine to check if a record or union contains an array field. */
1946 static int
1947 record_or_union_type_has_array_p (const_tree tree_type)
1949 tree fields = TYPE_FIELDS (tree_type);
1950 tree f;
1952 for (f = fields; f; f = DECL_CHAIN (f))
1953 if (TREE_CODE (f) == FIELD_DECL)
1955 tree field_type = TREE_TYPE (f);
1956 if (RECORD_OR_UNION_TYPE_P (field_type)
1957 && record_or_union_type_has_array_p (field_type))
1958 return 1;
1959 if (TREE_CODE (field_type) == ARRAY_TYPE)
1960 return 1;
1962 return 0;
1965 /* Check if the current function has local referenced variables that
1966 have their addresses taken, contain an array, or are arrays. */
1968 static bool
1969 stack_protect_decl_p ()
1971 unsigned i;
1972 tree var;
1974 FOR_EACH_LOCAL_DECL (cfun, i, var)
1975 if (!is_global_var (var))
1977 tree var_type = TREE_TYPE (var);
1978 if (VAR_P (var)
1979 && (TREE_CODE (var_type) == ARRAY_TYPE
1980 || TREE_ADDRESSABLE (var)
1981 || (RECORD_OR_UNION_TYPE_P (var_type)
1982 && record_or_union_type_has_array_p (var_type))))
1983 return true;
1985 return false;
1988 /* Check if the current function has calls that use a return slot. */
1990 static bool
1991 stack_protect_return_slot_p ()
1993 basic_block bb;
1995 FOR_ALL_BB_FN (bb, cfun)
1996 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1997 !gsi_end_p (gsi); gsi_next (&gsi))
1999 gimple *stmt = gsi_stmt (gsi);
2000 /* This assumes that calls to internal-only functions never
2001 use a return slot. */
2002 if (is_gimple_call (stmt)
2003 && !gimple_call_internal_p (stmt)
2004 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2005 gimple_call_fndecl (stmt)))
2006 return true;
2008 return false;
2011 /* Expand all variables used in the function. */
2013 static rtx_insn *
2014 expand_used_vars (void)
2016 tree var, outer_block = DECL_INITIAL (current_function_decl);
2017 auto_vec<tree> maybe_local_decls;
2018 rtx_insn *var_end_seq = NULL;
2019 unsigned i;
2020 unsigned len;
2021 bool gen_stack_protect_signal = false;
2023 /* Compute the phase of the stack frame for this function. */
2025 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2026 int off = STARTING_FRAME_OFFSET % align;
2027 frame_phase = off ? align - off : 0;
2030 /* Set TREE_USED on all variables in the local_decls. */
2031 FOR_EACH_LOCAL_DECL (cfun, i, var)
2032 TREE_USED (var) = 1;
2033 /* Clear TREE_USED on all variables associated with a block scope. */
2034 clear_tree_used (DECL_INITIAL (current_function_decl));
2036 init_vars_expansion ();
2038 if (targetm.use_pseudo_pic_reg ())
2039 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2041 for (i = 0; i < SA.map->num_partitions; i++)
2043 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2044 continue;
2046 tree var = partition_to_var (SA.map, i);
2048 gcc_assert (!virtual_operand_p (var));
2050 expand_one_ssa_partition (var);
2053 if (flag_stack_protect == SPCT_FLAG_STRONG)
2054 gen_stack_protect_signal
2055 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2057 /* At this point all variables on the local_decls with TREE_USED
2058 set are not associated with any block scope. Lay them out. */
2060 len = vec_safe_length (cfun->local_decls);
2061 FOR_EACH_LOCAL_DECL (cfun, i, var)
2063 bool expand_now = false;
2065 /* Expanded above already. */
2066 if (is_gimple_reg (var))
2068 TREE_USED (var) = 0;
2069 goto next;
2071 /* We didn't set a block for static or extern because it's hard
2072 to tell the difference between a global variable (re)declared
2073 in a local scope, and one that's really declared there to
2074 begin with. And it doesn't really matter much, since we're
2075 not giving them stack space. Expand them now. */
2076 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2077 expand_now = true;
2079 /* Expand variables not associated with any block now. Those created by
2080 the optimizers could be live anywhere in the function. Those that
2081 could possibly have been scoped originally and detached from their
2082 block will have their allocation deferred so we coalesce them with
2083 others when optimization is enabled. */
2084 else if (TREE_USED (var))
2085 expand_now = true;
2087 /* Finally, mark all variables on the list as used. We'll use
2088 this in a moment when we expand those associated with scopes. */
2089 TREE_USED (var) = 1;
2091 if (expand_now)
2092 expand_one_var (var, true, true);
2094 next:
2095 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2097 rtx rtl = DECL_RTL_IF_SET (var);
2099 /* Keep artificial non-ignored vars in cfun->local_decls
2100 chain until instantiate_decls. */
2101 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2102 add_local_decl (cfun, var);
2103 else if (rtl == NULL_RTX)
2104 /* If rtl isn't set yet, which can happen e.g. with
2105 -fstack-protector, retry before returning from this
2106 function. */
2107 maybe_local_decls.safe_push (var);
2111 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2113 +-----------------+-----------------+
2114 | ...processed... | ...duplicates...|
2115 +-----------------+-----------------+
2117 +-- LEN points here.
2119 We just want the duplicates, as those are the artificial
2120 non-ignored vars that we want to keep until instantiate_decls.
2121 Move them down and truncate the array. */
2122 if (!vec_safe_is_empty (cfun->local_decls))
2123 cfun->local_decls->block_remove (0, len);
2125 /* At this point, all variables within the block tree with TREE_USED
2126 set are actually used by the optimized function. Lay them out. */
2127 expand_used_vars_for_block (outer_block, true);
2129 if (stack_vars_num > 0)
2131 add_scope_conflicts ();
2133 /* If stack protection is enabled, we don't share space between
2134 vulnerable data and non-vulnerable data. */
2135 if (flag_stack_protect != 0
2136 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2137 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2138 && lookup_attribute ("stack_protect",
2139 DECL_ATTRIBUTES (current_function_decl)))))
2140 add_stack_protection_conflicts ();
2142 /* Now that we have collected all stack variables, and have computed a
2143 minimal interference graph, attempt to save some stack space. */
2144 partition_stack_vars ();
2145 if (dump_file)
2146 dump_stack_var_partition ();
2149 switch (flag_stack_protect)
2151 case SPCT_FLAG_ALL:
2152 create_stack_guard ();
2153 break;
2155 case SPCT_FLAG_STRONG:
2156 if (gen_stack_protect_signal
2157 || cfun->calls_alloca || has_protected_decls
2158 || lookup_attribute ("stack_protect",
2159 DECL_ATTRIBUTES (current_function_decl)))
2160 create_stack_guard ();
2161 break;
2163 case SPCT_FLAG_DEFAULT:
2164 if (cfun->calls_alloca || has_protected_decls
2165 || lookup_attribute ("stack_protect",
2166 DECL_ATTRIBUTES (current_function_decl)))
2167 create_stack_guard ();
2168 break;
2170 case SPCT_FLAG_EXPLICIT:
2171 if (lookup_attribute ("stack_protect",
2172 DECL_ATTRIBUTES (current_function_decl)))
2173 create_stack_guard ();
2174 break;
2175 default:
2179 /* Assign rtl to each variable based on these partitions. */
2180 if (stack_vars_num > 0)
2182 struct stack_vars_data data;
2184 data.asan_base = NULL_RTX;
2185 data.asan_alignb = 0;
2187 /* Reorder decls to be protected by iterating over the variables
2188 array multiple times, and allocating out of each phase in turn. */
2189 /* ??? We could probably integrate this into the qsort we did
2190 earlier, such that we naturally see these variables first,
2191 and thus naturally allocate things in the right order. */
2192 if (has_protected_decls)
2194 /* Phase 1 contains only character arrays. */
2195 expand_stack_vars (stack_protect_decl_phase_1, &data);
2197 /* Phase 2 contains other kinds of arrays. */
2198 if (flag_stack_protect == SPCT_FLAG_ALL
2199 || flag_stack_protect == SPCT_FLAG_STRONG
2200 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2201 && lookup_attribute ("stack_protect",
2202 DECL_ATTRIBUTES (current_function_decl))))
2203 expand_stack_vars (stack_protect_decl_phase_2, &data);
2206 if (asan_sanitize_stack_p ())
2207 /* Phase 3, any partitions that need asan protection
2208 in addition to phase 1 and 2. */
2209 expand_stack_vars (asan_decl_phase_3, &data);
2211 if (!data.asan_vec.is_empty ())
2213 HOST_WIDE_INT prev_offset = frame_offset;
2214 HOST_WIDE_INT offset, sz, redzonesz;
2215 redzonesz = ASAN_RED_ZONE_SIZE;
2216 sz = data.asan_vec[0] - prev_offset;
2217 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2218 && data.asan_alignb <= 4096
2219 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2220 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2221 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2222 offset
2223 = alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE);
2224 data.asan_vec.safe_push (prev_offset);
2225 data.asan_vec.safe_push (offset);
2226 /* Leave space for alignment if STRICT_ALIGNMENT. */
2227 if (STRICT_ALIGNMENT)
2228 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2229 << ASAN_SHADOW_SHIFT)
2230 / BITS_PER_UNIT, 1);
2232 var_end_seq
2233 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2234 data.asan_base,
2235 data.asan_alignb,
2236 data.asan_vec.address (),
2237 data.asan_decl_vec.address (),
2238 data.asan_vec.length ());
2241 expand_stack_vars (NULL, &data);
2244 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2245 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2246 virtual_stack_vars_rtx,
2247 var_end_seq);
2249 fini_vars_expansion ();
2251 /* If there were any artificial non-ignored vars without rtl
2252 found earlier, see if deferred stack allocation hasn't assigned
2253 rtl to them. */
2254 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2256 rtx rtl = DECL_RTL_IF_SET (var);
2258 /* Keep artificial non-ignored vars in cfun->local_decls
2259 chain until instantiate_decls. */
2260 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2261 add_local_decl (cfun, var);
2264 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2265 if (STACK_ALIGNMENT_NEEDED)
2267 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2268 if (!FRAME_GROWS_DOWNWARD)
2269 frame_offset += align - 1;
2270 frame_offset &= -align;
2273 return var_end_seq;
2277 /* If we need to produce a detailed dump, print the tree representation
2278 for STMT to the dump file. SINCE is the last RTX after which the RTL
2279 generated for STMT should have been appended. */
2281 static void
2282 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2284 if (dump_file && (dump_flags & TDF_DETAILS))
2286 fprintf (dump_file, "\n;; ");
2287 print_gimple_stmt (dump_file, stmt, 0,
2288 TDF_SLIM | (dump_flags & TDF_LINENO));
2289 fprintf (dump_file, "\n");
2291 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2295 /* Maps the blocks that do not contain tree labels to rtx labels.
   label_rtx_for_bb looks a block up here before scanning it for a tree
   label, and records here every label it creates with gen_label_rtx, so
   repeated queries for the same block return the same label.  */
2297 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2299 /* Returns the label_rtx expression for a label starting basic block BB. */
2301 static rtx_code_label *
2302 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2304 gimple_stmt_iterator gsi;
2305 tree lab;
2307 if (bb->flags & BB_RTL)
2308 return block_label (bb);
2310 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2311 if (elt)
2312 return *elt;
2314 /* Find the tree label if it is present. */
2316 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2318 glabel *lab_stmt;
2320 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2321 if (!lab_stmt)
2322 break;
2324 lab = gimple_label_label (lab_stmt);
2325 if (DECL_NONLOCAL (lab))
2326 break;
2328 return jump_target_rtx (lab);
2331 rtx_code_label *l = gen_label_rtx ();
2332 lab_rtx_for_bb->put (bb, l);
2333 return l;
2337 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2338 of a basic block where we just expanded the conditional at the end,
2339 possibly clean up the CFG and instruction sequence. LAST is the
2340 last instruction before the just emitted jump sequence. */
/* Nothing happens unless the most recently emitted insn is a BARRIER.
   In that case E is removed from the CFG and every jump (together with
   the barrier following an unconditional one) lying strictly between
   LAST and the final unconditional jump is deleted.  */
2342 static void
2343 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2345 /* Special case: when jumpif decides that the condition is
2346 trivial it emits an unconditional jump (and the necessary
2347 barrier). But we still have two edges, the fallthru one is
2348 wrong. purge_dead_edges would clean this up later. Unfortunately
2349 we have to insert insns (and split edges) before
2350 find_many_sub_basic_blocks and hence before purge_dead_edges.
2351 But splitting edges might create new blocks which depend on the
2352 fact that if there are two edges there's no barrier. So the
2353 barrier would get lost and verify_flow_info would ICE. Instead
2354 of auditing all edge splitters to care for the barrier (which
2355 normally isn't there in a cleaned CFG), fix it here. */
2356 if (BARRIER_P (get_last_insn ()))
2358 rtx_insn *insn;
2359 remove_edge (e);
2360 /* Now, we have a single successor block, if we have insns to
2361 insert on the remaining edge we potentially will insert
2362 it at the end of this block (if the dest block isn't feasible)
2363 in order to avoid splitting the edge. This insertion will take
2364 place in front of the last jump. But we might have emitted
2365 multiple jumps (conditional and one unconditional) to the
2366 same destination. Inserting in front of the last one then
2367 is a problem. See PR 40021. We fix this by deleting all
2368 jumps except the last unconditional one. */
/* The insn just before the trailing barrier must be the final jump.  */
2369 insn = PREV_INSN (get_last_insn ());
2370 /* Make sure we have an unconditional jump. Otherwise we're
2371 confused. */
2372 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
/* Walk backwards from the insn preceding the final jump until LAST is
   reached.  INSN is stepped back before anything is inspected, so the
   insn under examination is always NEXT_INSN (insn); presumably this is
   what keeps the cursor usable after that insn has been deleted.  */
2373 for (insn = PREV_INSN (insn); insn != last;)
2375 insn = PREV_INSN (insn);
2376 if (JUMP_P (NEXT_INSN (insn)))
/* An unconditional jump is expected to be followed by a barrier, which
   is removed first; the jump itself is removed in either case.  */
2378 if (!any_condjump_p (NEXT_INSN (insn)))
2380 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2381 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2383 delete_insn (NEXT_INSN (insn));
2389 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2390 Returns a new basic block if we've terminated the current basic
2391 block and created a new one. */
/* BB is the block that ends in STMT.  NULL is returned when one of the
   two successors is BB->next_bb, so that a single conditional jump with
   a fallthru edge is enough; otherwise the block created to hold the
   extra unconditional jump is returned.  */
2393 static basic_block
2394 expand_gimple_cond (basic_block bb, gcond *stmt)
2396 basic_block new_bb, dest;
2397 edge true_edge;
2398 edge false_edge;
2399 rtx_insn *last2, *last;
2400 enum tree_code code;
2401 tree op0, op1;
2403 code = gimple_cond_code (stmt);
2404 op0 = gimple_cond_lhs (stmt);
2405 op1 = gimple_cond_rhs (stmt);
2406 /* We're sometimes presented with such code:
2407 D.123_1 = x < y;
2408 if (D.123_1 != 0)
2410 This would expand to two comparisons which then later might
2411 be cleaned up by combine. But some pattern matchers like if-conversion
2412 work better when there's only one compare, so make up for this
2413 here as special exception if TER would have made the same change. */
/* The substitution is only tried for "bool_name != 0" or "bool_name == 1"
   where the name's version is set in SA.values.  */
2414 if (SA.values
2415 && TREE_CODE (op0) == SSA_NAME
2416 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2417 && TREE_CODE (op1) == INTEGER_CST
2418 && ((gimple_cond_code (stmt) == NE_EXPR
2419 && integer_zerop (op1))
2420 || (gimple_cond_code (stmt) == EQ_EXPR
2421 && integer_onep (op1)))
2422 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2424 gimple *second = SSA_NAME_DEF_STMT (op0);
2425 if (gimple_code (second) == GIMPLE_ASSIGN)
2427 enum tree_code code2 = gimple_assign_rhs_code (second);
/* A defining comparison replaces the condition wholesale.  */
2428 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2430 code = code2;
2431 op0 = gimple_assign_rhs1 (second);
2432 op1 = gimple_assign_rhs2 (second);
2434 /* If jumps are cheap and the target does not support conditional
2435 compare, turn some more codes into jumpy sequences. */
2436 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2437 && targetm.gen_ccmp_first == NULL)
/* A one-bit BIT_AND_EXPR with a non-constant second operand, or a
   TRUTH_AND_EXPR, becomes TRUTH_ANDIF_EXPR; BIT_IOR_EXPR and
   TRUTH_OR_EXPR become TRUTH_ORIF_EXPR.  */
2439 if ((code2 == BIT_AND_EXPR
2440 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2441 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2442 || code2 == TRUTH_AND_EXPR)
2444 code = TRUTH_ANDIF_EXPR;
2445 op0 = gimple_assign_rhs1 (second);
2446 op1 = gimple_assign_rhs2 (second);
2448 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2450 code = TRUTH_ORIF_EXPR;
2451 op0 = gimple_assign_rhs1 (second);
2452 op1 = gimple_assign_rhs2 (second);
/* LAST2 keeps pointing at the insn that preceded everything emitted for
   STMT and is only used for the dump in the two-way case; LAST is
   reassigned there once the conditional jump has been emitted.  */
2458 last2 = last = get_last_insn ();
2460 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2461 set_curr_insn_location (gimple_location (stmt));
2463 /* These flags have no purpose in RTL land. */
2464 true_edge->flags &= ~EDGE_TRUE_VALUE;
2465 false_edge->flags &= ~EDGE_FALSE_VALUE;
2467 /* We can either have a pure conditional jump with one fallthru edge or
2468 two-way jump that needs to be decomposed into two basic blocks. */
/* False destination is the next block: jump when the condition holds
   and let the false edge fall through.  */
2469 if (false_edge->dest == bb->next_bb)
2471 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2472 true_edge->probability);
2473 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2474 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2475 set_curr_insn_location (true_edge->goto_locus);
2476 false_edge->flags |= EDGE_FALLTHRU;
2477 maybe_cleanup_end_of_block (false_edge, last);
2478 return NULL;
/* True destination is the next block: jump when the condition fails
   and let the true edge fall through.  */
2480 if (true_edge->dest == bb->next_bb)
2482 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2483 false_edge->probability);
2484 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2485 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2486 set_curr_insn_location (false_edge->goto_locus);
2487 true_edge->flags |= EDGE_FALLTHRU;
2488 maybe_cleanup_end_of_block (true_edge, last);
2489 return NULL;
/* Two-way case: emit a conditional jump to the true destination followed
   by an unconditional jump to the false destination.  */
2492 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2493 true_edge->probability);
2494 last = get_last_insn ();
2495 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2496 set_curr_insn_location (false_edge->goto_locus);
2497 emit_jump (label_rtx_for_bb (false_edge->dest));
/* BB ends at the last insn of the conditional jump sequence (stepping
   back over a barrier if that is what LAST is).  */
2499 BB_END (bb) = last;
2500 if (BARRIER_P (BB_END (bb)))
2501 BB_END (bb) = PREV_INSN (BB_END (bb));
2502 update_bb_for_insn (bb);
/* Everything emitted after LAST, i.e. the unconditional jump, goes into
   NEW_BB.  The false edge is redirected to NEW_BB as a fallthru, and
   NEW_BB gets a single successor edge to the old false destination.  */
2504 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2505 dest = false_edge->dest;
2506 redirect_edge_succ (false_edge, new_bb);
2507 false_edge->flags |= EDGE_FALLTHRU;
2508 new_bb->count = false_edge->count;
2509 new_bb->frequency = EDGE_FREQUENCY (false_edge);
2510 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2511 add_bb_to_loop (new_bb, loop);
/* If BB was the latch of a loop headed by DEST, NEW_BB now sits between
   them and takes over as the latch.  */
2512 if (loop->latch == bb
2513 && loop->header == dest)
2514 loop->latch = new_bb;
2515 make_single_succ_edge (new_bb, dest, 0);
2516 if (BARRIER_P (BB_END (new_bb)))
2517 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2518 update_bb_for_insn (new_bb);
2520 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
/* NOTE(review): the current insn location is set from the true edge's
   goto_locus and then read straight back into it; confirm what
   curr_insn_location () is expected to return here.  */
2522 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2524 set_curr_insn_location (true_edge->goto_locus);
2525 true_edge->goto_locus = curr_insn_location ();
2528 return new_bb;
2531 /* Mark all calls that can have a transaction restart. */
2533 static void
2534 mark_transaction_restart_calls (gimple *stmt)
2536 struct tm_restart_node dummy;
2537 tm_restart_node **slot;
2539 if (!cfun->gimple_df->tm_restart)
2540 return;
2542 dummy.stmt = stmt;
2543 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2544 if (slot)
2546 struct tm_restart_node *n = *slot;
2547 tree list = n->label_or_list;
2548 rtx_insn *insn;
2550 for (insn = next_real_insn (get_last_insn ());
2551 !CALL_P (insn);
2552 insn = next_real_insn (insn))
2553 continue;
2555 if (TREE_CODE (list) == LABEL_DECL)
2556 add_reg_note (insn, REG_TM, label_rtx (list));
2557 else
2558 for (; list ; list = TREE_CHAIN (list))
2559 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2563 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2564 statement STMT. */
/* Internal-function calls are handed to expand_internal_call.  For every
   other call a CALL_EXPR tree mirroring STMT is built and expanded, either
   as the source of an assignment to the call's lhs or for its side
   effects only.  */
2566 static void
2567 expand_call_stmt (gcall *stmt)
2569 tree exp, decl, lhs;
2570 bool builtin_p;
2571 size_t i;
2573 if (gimple_call_internal_p (stmt))
2575 expand_internal_call (stmt);
2576 return;
2579 /* If this is a call to a built-in function and it has no effect other
2580 than setting the lhs, try to implement it using an internal function
2581 instead. */
2582 decl = gimple_call_fndecl (stmt);
2583 if (gimple_call_lhs (stmt)
2584 && !gimple_has_side_effects (stmt)
2585 && (optimize || (decl && called_as_built_in (decl))))
2587 internal_fn ifn = replacement_internal_fn (stmt);
2588 if (ifn != IFN_LAST)
2590 expand_internal_call (ifn, stmt);
2591 return;
/* Presumably the three operand slots beyond the arguments hold the
   operand count, the callee and the static chain -- TODO confirm against
   the CALL_EXPR layout.  */
2595 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2597 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2598 builtin_p = decl && DECL_BUILT_IN (decl);
2600 /* If this is not a builtin function, the function type through which the
2601 call is made may be different from the type of the function. */
2602 if (!builtin_p)
2603 CALL_EXPR_FN (exp)
2604 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2605 CALL_EXPR_FN (exp));
2607 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2608 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
/* Copy the arguments across, one by one.  */
2610 for (i = 0; i < gimple_call_num_args (stmt); i++)
2612 tree arg = gimple_call_arg (stmt, i);
2613 gimple *def;
2614 /* TER addresses into arguments of builtin functions so we have a
2615 chance to infer more correct alignment information. See PR39954. */
2616 if (builtin_p
2617 && TREE_CODE (arg) == SSA_NAME
2618 && (def = get_gimple_for_ssa_name (arg))
2619 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2620 arg = gimple_assign_rhs1 (def);
2621 CALL_EXPR_ARG (exp, i) = arg;
/* Mirror the statement's properties onto the tree.  */
2624 if (gimple_has_side_effects (stmt))
2625 TREE_SIDE_EFFECTS (exp) = 1;
2627 if (gimple_call_nothrow_p (stmt))
2628 TREE_NOTHROW (exp) = 1;
2630 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2631 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2632 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
/* Only one of CALL_ALLOCA_FOR_VAR_P and CALL_FROM_THUNK_P is written:
   the former for calls to the normal builtins alloca and
   alloca_with_align, the latter for everything else.  */
2633 if (decl
2634 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
2635 && (DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA
2636 || DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA_WITH_ALIGN))
2637 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2638 else
2639 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2640 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2641 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2642 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2643 CALL_WITH_BOUNDS_P (exp) = gimple_call_with_bounds_p (stmt);
2645 /* Ensure RTL is created for debug args. */
2646 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2648 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2649 unsigned int ix;
2650 tree dtemp;
/* Only the odd-indexed elements are visited, and each is asserted to be
   a DEBUG_EXPR_DECL; presumably the vector stores pairs whose second
   member is the debug decl -- TODO confirm.  */
2652 if (debug_args)
2653 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2655 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2656 expand_debug_expr (dtemp);
/* With an lhs the call is expanded as the source of an assignment;
   without one it is expanded with const0_rtx as target.  */
2660 lhs = gimple_call_lhs (stmt);
2661 if (lhs)
2662 expand_assignment (lhs, exp, false);
2663 else
2664 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2666 mark_transaction_restart_calls (stmt);
2670 /* Generate RTL for an asm statement (explicit assembler code).
2671 STRING is a STRING_CST node containing the assembler code text,
2672 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2673 insn is volatile; don't optimize it. */
2675 static void
2676 expand_asm_loc (tree string, int vol, location_t locus)
2678 rtx body;
2680 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2681 ggc_strdup (TREE_STRING_POINTER (string)),
2682 locus);
2684 MEM_VOLATILE_P (body) = vol;
2686 /* Non-empty basic ASM implicitly clobbers memory. */
2687 if (TREE_STRING_LENGTH (string) != 0)
2689 rtx asm_op, clob;
2690 unsigned i, nclobbers;
2691 auto_vec<rtx> input_rvec, output_rvec;
2692 auto_vec<const char *> constraints;
2693 auto_vec<rtx> clobber_rvec;
2694 HARD_REG_SET clobbered_regs;
2695 CLEAR_HARD_REG_SET (clobbered_regs);
2697 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2698 clobber_rvec.safe_push (clob);
2700 if (targetm.md_asm_adjust)
2701 targetm.md_asm_adjust (output_rvec, input_rvec,
2702 constraints, clobber_rvec,
2703 clobbered_regs);
2705 asm_op = body;
2706 nclobbers = clobber_rvec.length ();
2707 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2709 XVECEXP (body, 0, 0) = asm_op;
2710 for (i = 0; i < nclobbers; i++)
2711 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2714 emit_insn (body);
/* Count how many characters of the NUL-terminated string S compare
   equal to C.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;
  for (const char *p = s; *p != '\0'; ++p)
    if (*p == c)
      count++;
  return count;
}
2727 /* A subroutine of expand_asm_operands. Check that all operands have
2728 the same number of alternatives. Return true if so. */
2730 static bool
2731 check_operand_nalternatives (const vec<const char *> &constraints)
2733 unsigned len = constraints.length();
2734 if (len > 0)
2736 int nalternatives = n_occurrences (',', constraints[0]);
2738 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2740 error ("too many alternatives in %<asm%>");
2741 return false;
2744 for (unsigned i = 1; i < len; ++i)
2745 if (n_occurrences (',', constraints[i]) != nalternatives)
2747 error ("operand constraints for %<asm%> differ "
2748 "in number of alternatives");
2749 return false;
2752 return true;
2755 /* Check for overlap between registers marked in CLOBBERED_REGS and
2756 anything inappropriate in T. Emit error and return the register
2757 variable definition for error, NULL_TREE for ok. */
2759 static bool
2760 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2762 /* Conflicts between asm-declared register variables and the clobber
2763 list are not allowed. */
2764 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2766 if (overlap)
2768 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2769 DECL_NAME (overlap));
2771 /* Reset registerness to stop multiple errors emitted for a single
2772 variable. */
2773 DECL_REGISTER (overlap) = 0;
2774 return true;
2777 return false;
2780 /* Generate RTL for an asm statement with arguments.
2781 STRING is the instruction template.
2782 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2783 Each output or input has an expression in the TREE_VALUE and
2784 a tree list in TREE_PURPOSE which in turn contains a constraint
2785 name in TREE_VALUE (or NULL_TREE) and a constraint string
2786 in TREE_PURPOSE.
2787 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2788 that is clobbered by this insn.
2790 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2791 should be the fallthru basic block of the asm goto.
2793 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2794 Some elements of OUTPUTS may be replaced with trees representing temporary
2795 values. The caller should copy those temporary values to the originally
2796 specified lvalues.
2798 VOL nonzero means the insn is volatile; don't optimize it. */
2800 static void
2801 expand_asm_stmt (gasm *stmt)
2803 class save_input_location
2805 location_t old;
2807 public:
2808 explicit save_input_location(location_t where)
2810 old = input_location;
2811 input_location = where;
2814 ~save_input_location()
2816 input_location = old;
2820 location_t locus = gimple_location (stmt);
2822 if (gimple_asm_input_p (stmt))
2824 const char *s = gimple_asm_string (stmt);
2825 tree string = build_string (strlen (s), s);
2826 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2827 return;
2830 /* There are some legacy diagnostics in here, and this also avoids a
2831 sixth parameter to targetm.md_asm_adjust. */
2832 save_input_location s_i_l(locus);
2834 unsigned noutputs = gimple_asm_noutputs (stmt);
2835 unsigned ninputs = gimple_asm_ninputs (stmt);
2836 unsigned nlabels = gimple_asm_nlabels (stmt);
2837 unsigned i;
2839 /* ??? Diagnose during gimplification? */
2840 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2842 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2843 return;
2846 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2847 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2848 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2850 /* Copy the gimple vectors into new vectors that we can manipulate. */
2852 output_tvec.safe_grow (noutputs);
2853 input_tvec.safe_grow (ninputs);
2854 constraints.safe_grow (noutputs + ninputs);
2856 for (i = 0; i < noutputs; ++i)
2858 tree t = gimple_asm_output_op (stmt, i);
2859 output_tvec[i] = TREE_VALUE (t);
2860 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2862 for (i = 0; i < ninputs; i++)
2864 tree t = gimple_asm_input_op (stmt, i);
2865 input_tvec[i] = TREE_VALUE (t);
2866 constraints[i + noutputs]
2867 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2870 /* ??? Diagnose during gimplification? */
2871 if (! check_operand_nalternatives (constraints))
2872 return;
2874 /* Count the number of meaningful clobbered registers, ignoring what
2875 we would ignore later. */
2876 auto_vec<rtx> clobber_rvec;
2877 HARD_REG_SET clobbered_regs;
2878 CLEAR_HARD_REG_SET (clobbered_regs);
2880 if (unsigned n = gimple_asm_nclobbers (stmt))
2882 clobber_rvec.reserve (n);
2883 for (i = 0; i < n; i++)
2885 tree t = gimple_asm_clobber_op (stmt, i);
2886 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2887 int nregs, j;
2889 j = decode_reg_name_and_count (regname, &nregs);
2890 if (j < 0)
2892 if (j == -2)
2894 /* ??? Diagnose during gimplification? */
2895 error ("unknown register name %qs in %<asm%>", regname);
2897 else if (j == -4)
2899 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2900 clobber_rvec.safe_push (x);
2902 else
2904 /* Otherwise we should have -1 == empty string
2905 or -3 == cc, which is not a register. */
2906 gcc_assert (j == -1 || j == -3);
2909 else
2910 for (int reg = j; reg < j + nregs; reg++)
2912 /* Clobbering the PIC register is an error. */
2913 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2915 /* ??? Diagnose during gimplification? */
2916 error ("PIC register clobbered by %qs in %<asm%>",
2917 regname);
2918 return;
2921 SET_HARD_REG_BIT (clobbered_regs, reg);
2922 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2923 clobber_rvec.safe_push (x);
2927 unsigned nclobbers = clobber_rvec.length();
2929 /* First pass over inputs and outputs checks validity and sets
2930 mark_addressable if needed. */
2931 /* ??? Diagnose during gimplification? */
2933 for (i = 0; i < noutputs; ++i)
2935 tree val = output_tvec[i];
2936 tree type = TREE_TYPE (val);
2937 const char *constraint;
2938 bool is_inout;
2939 bool allows_reg;
2940 bool allows_mem;
2942 /* Try to parse the output constraint. If that fails, there's
2943 no point in going further. */
2944 constraint = constraints[i];
2945 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
2946 &allows_mem, &allows_reg, &is_inout))
2947 return;
2949 if (! allows_reg
2950 && (allows_mem
2951 || is_inout
2952 || (DECL_P (val)
2953 && REG_P (DECL_RTL (val))
2954 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
2955 mark_addressable (val);
2958 for (i = 0; i < ninputs; ++i)
2960 bool allows_reg, allows_mem;
2961 const char *constraint;
2963 constraint = constraints[i + noutputs];
2964 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
2965 constraints.address (),
2966 &allows_mem, &allows_reg))
2967 return;
2969 if (! allows_reg && allows_mem)
2970 mark_addressable (input_tvec[i]);
2973 /* Second pass evaluates arguments. */
2975 /* Make sure stack is consistent for asm goto. */
2976 if (nlabels > 0)
2977 do_pending_stack_adjust ();
2978 int old_generating_concat_p = generating_concat_p;
2980 /* Vector of RTX's of evaluated output operands. */
2981 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
2982 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
2983 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
2985 output_rvec.safe_grow (noutputs);
2987 for (i = 0; i < noutputs; ++i)
2989 tree val = output_tvec[i];
2990 tree type = TREE_TYPE (val);
2991 bool is_inout, allows_reg, allows_mem, ok;
2992 rtx op;
2994 ok = parse_output_constraint (&constraints[i], i, ninputs,
2995 noutputs, &allows_mem, &allows_reg,
2996 &is_inout);
2997 gcc_assert (ok);
2999 /* If an output operand is not a decl or indirect ref and our constraint
3000 allows a register, make a temporary to act as an intermediate.
3001 Make the asm insn write into that, then we will copy it to
3002 the real output operand. Likewise for promoted variables. */
3004 generating_concat_p = 0;
3006 if ((TREE_CODE (val) == INDIRECT_REF
3007 && allows_mem)
3008 || (DECL_P (val)
3009 && (allows_mem || REG_P (DECL_RTL (val)))
3010 && ! (REG_P (DECL_RTL (val))
3011 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3012 || ! allows_reg
3013 || is_inout)
3015 op = expand_expr (val, NULL_RTX, VOIDmode,
3016 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3017 if (MEM_P (op))
3018 op = validize_mem (op);
3020 if (! allows_reg && !MEM_P (op))
3021 error ("output number %d not directly addressable", i);
3022 if ((! allows_mem && MEM_P (op))
3023 || GET_CODE (op) == CONCAT)
3025 rtx old_op = op;
3026 op = gen_reg_rtx (GET_MODE (op));
3028 generating_concat_p = old_generating_concat_p;
3030 if (is_inout)
3031 emit_move_insn (op, old_op);
3033 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3034 emit_move_insn (old_op, op);
3035 after_rtl_seq = get_insns ();
3036 after_rtl_end = get_last_insn ();
3037 end_sequence ();
3040 else
3042 op = assign_temp (type, 0, 1);
3043 op = validize_mem (op);
3044 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3045 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3047 generating_concat_p = old_generating_concat_p;
3049 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3050 expand_assignment (val, make_tree (type, op), false);
3051 after_rtl_seq = get_insns ();
3052 after_rtl_end = get_last_insn ();
3053 end_sequence ();
3055 output_rvec[i] = op;
3057 if (is_inout)
3058 inout_opnum.safe_push (i);
3061 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3062 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3064 input_rvec.safe_grow (ninputs);
3065 input_mode.safe_grow (ninputs);
3067 generating_concat_p = 0;
3069 for (i = 0; i < ninputs; ++i)
3071 tree val = input_tvec[i];
3072 tree type = TREE_TYPE (val);
3073 bool allows_reg, allows_mem, ok;
3074 const char *constraint;
3075 rtx op;
3077 constraint = constraints[i + noutputs];
3078 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3079 constraints.address (),
3080 &allows_mem, &allows_reg);
3081 gcc_assert (ok);
3083 /* EXPAND_INITIALIZER will not generate code for valid initializer
3084 constants, but will still generate code for other types of operand.
3085 This is the behavior we want for constant constraints. */
3086 op = expand_expr (val, NULL_RTX, VOIDmode,
3087 allows_reg ? EXPAND_NORMAL
3088 : allows_mem ? EXPAND_MEMORY
3089 : EXPAND_INITIALIZER);
3091 /* Never pass a CONCAT to an ASM. */
3092 if (GET_CODE (op) == CONCAT)
3093 op = force_reg (GET_MODE (op), op);
3094 else if (MEM_P (op))
3095 op = validize_mem (op);
3097 if (asm_operand_ok (op, constraint, NULL) <= 0)
3099 if (allows_reg && TYPE_MODE (type) != BLKmode)
3100 op = force_reg (TYPE_MODE (type), op);
3101 else if (!allows_mem)
3102 warning (0, "asm operand %d probably doesn%'t match constraints",
3103 i + noutputs);
3104 else if (MEM_P (op))
3106 /* We won't recognize either volatile memory or memory
3107 with a queued address as a valid memory_operand
3108 at this point. Ignore it: clearly this *is* a memory. */
3110 else
3111 gcc_unreachable ();
3113 input_rvec[i] = op;
3114 input_mode[i] = TYPE_MODE (type);
3117 /* For in-out operands, copy output rtx to input rtx. */
3118 unsigned ninout = inout_opnum.length();
3119 for (i = 0; i < ninout; i++)
3121 int j = inout_opnum[i];
3122 rtx o = output_rvec[j];
3124 input_rvec.safe_push (o);
3125 input_mode.safe_push (GET_MODE (o));
3127 char buffer[16];
3128 sprintf (buffer, "%d", j);
3129 constraints.safe_push (ggc_strdup (buffer));
3131 ninputs += ninout;
3133 /* Sometimes we wish to automatically clobber registers across an asm.
3134 Case in point is when the i386 backend moved from cc0 to a hard reg --
3135 maintaining source-level compatibility means automatically clobbering
3136 the flags register. */
3137 rtx_insn *after_md_seq = NULL;
3138 if (targetm.md_asm_adjust)
3139 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3140 constraints, clobber_rvec,
3141 clobbered_regs);
3143 /* Do not allow the hook to change the output and input count,
3144 lest it mess up the operand numbering. */
3145 gcc_assert (output_rvec.length() == noutputs);
3146 gcc_assert (input_rvec.length() == ninputs);
3147 gcc_assert (constraints.length() == noutputs + ninputs);
3149 /* But it certainly can adjust the clobbers. */
3150 nclobbers = clobber_rvec.length();
3152 /* Third pass checks for easy conflicts. */
3153 /* ??? Why are we doing this on trees instead of rtx. */
3155 bool clobber_conflict_found = 0;
3156 for (i = 0; i < noutputs; ++i)
3157 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3158 clobber_conflict_found = 1;
3159 for (i = 0; i < ninputs - ninout; ++i)
3160 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3161 clobber_conflict_found = 1;
3163 /* Make vectors for the expression-rtx, constraint strings,
3164 and named operands. */
3166 rtvec argvec = rtvec_alloc (ninputs);
3167 rtvec constraintvec = rtvec_alloc (ninputs);
3168 rtvec labelvec = rtvec_alloc (nlabels);
3170 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3171 : GET_MODE (output_rvec[0])),
3172 ggc_strdup (gimple_asm_string (stmt)),
3173 "", 0, argvec, constraintvec,
3174 labelvec, locus);
3175 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3177 for (i = 0; i < ninputs; ++i)
3179 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3180 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3181 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3182 constraints[i + noutputs],
3183 locus);
3186 /* Copy labels to the vector. */
3187 rtx_code_label *fallthru_label = NULL;
3188 if (nlabels > 0)
3190 basic_block fallthru_bb = NULL;
3191 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3192 if (fallthru)
3193 fallthru_bb = fallthru->dest;
3195 for (i = 0; i < nlabels; ++i)
3197 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3198 rtx_insn *r;
3199 /* If asm goto has any labels in the fallthru basic block, use
3200 a label that we emit immediately after the asm goto. Expansion
3201 may insert further instructions into the same basic block after
3202 asm goto and if we don't do this, insertion of instructions on
3203 the fallthru edge might misbehave. See PR58670. */
3204 if (fallthru_bb && label_to_block_fn (cfun, label) == fallthru_bb)
3206 if (fallthru_label == NULL_RTX)
3207 fallthru_label = gen_label_rtx ();
3208 r = fallthru_label;
3210 else
3211 r = label_rtx (label);
3212 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3216 /* Now, for each output, construct an rtx
3217 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3218 ARGVEC CONSTRAINTS OPNAMES))
3219 If there is more than one, put them inside a PARALLEL. */
3221 if (nlabels > 0 && nclobbers == 0)
3223 gcc_assert (noutputs == 0);
3224 emit_jump_insn (body);
3226 else if (noutputs == 0 && nclobbers == 0)
3228 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3229 emit_insn (body);
3231 else if (noutputs == 1 && nclobbers == 0)
3233 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3234 emit_insn (gen_rtx_SET (output_rvec[0], body));
3236 else
3238 rtx obody = body;
3239 int num = noutputs;
3241 if (num == 0)
3242 num = 1;
3244 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3246 /* For each output operand, store a SET. */
3247 for (i = 0; i < noutputs; ++i)
3249 rtx src, o = output_rvec[i];
3250 if (i == 0)
3252 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3253 src = obody;
3255 else
3257 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3258 ASM_OPERANDS_TEMPLATE (obody),
3259 constraints[i], i, argvec,
3260 constraintvec, labelvec, locus);
3261 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3263 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3266 /* If there are no outputs (but there are some clobbers)
3267 store the bare ASM_OPERANDS into the PARALLEL. */
3268 if (i == 0)
3269 XVECEXP (body, 0, i++) = obody;
3271 /* Store (clobber REG) for each clobbered register specified. */
3272 for (unsigned j = 0; j < nclobbers; ++j)
3274 rtx clobbered_reg = clobber_rvec[j];
3276 /* Do sanity check for overlap between clobbers and respectively
3277 input and outputs that hasn't been handled. Such overlap
3278 should have been detected and reported above. */
3279 if (!clobber_conflict_found && REG_P (clobbered_reg))
3281 /* We test the old body (obody) contents to avoid
3282 tripping over the under-construction body. */
3283 for (unsigned k = 0; k < noutputs; ++k)
3284 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3285 internal_error ("asm clobber conflict with output operand");
3287 for (unsigned k = 0; k < ninputs - ninout; ++k)
3288 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3289 internal_error ("asm clobber conflict with input operand");
3292 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3295 if (nlabels > 0)
3296 emit_jump_insn (body);
3297 else
3298 emit_insn (body);
3301 generating_concat_p = old_generating_concat_p;
3303 if (fallthru_label)
3304 emit_label (fallthru_label);
3306 if (after_md_seq)
3307 emit_insn (after_md_seq);
3308 if (after_rtl_seq)
3309 emit_insn (after_rtl_seq);
3311 free_temp_slots ();
3312 crtl->has_asm_statement = 1;
3315 /* Emit code to jump to the address
3316 specified by the pointer expression EXP. */
3318 static void
3319 expand_computed_goto (tree exp)
3321 rtx x = expand_normal (exp);
3323 do_pending_stack_adjust ();
3324 emit_indirect_jump (x);
3327 /* Generate RTL code for a `goto' statement with target label LABEL.
3328 LABEL should be a LABEL_DECL tree node that was or will later be
3329 defined with `expand_label'. */
3331 static void
3332 expand_goto (tree label)
3334 if (flag_checking)
3336 /* Check for a nonlocal goto to a containing function. Should have
3337 gotten translated to __builtin_nonlocal_goto. */
3338 tree context = decl_function_context (label);
3339 gcc_assert (!context || context == current_function_decl);
3342 emit_jump (jump_target_rtx (label));
3345 /* Output a return with no value. */
3347 static void
3348 expand_null_return_1 (void)
3350 clear_pending_stack_adjust ();
3351 do_pending_stack_adjust ();
3352 emit_jump (return_label);
3355 /* Generate RTL to return from the current function, with no value.
3356 (That is, we do not do anything about returning any value.) */
3358 void
3359 expand_null_return (void)
3361 /* If this function was declared to return a value, but we
3362 didn't, clobber the return registers so that they are not
3363 propagated live to the rest of the function. */
3364 clobber_return_register ();
3366 expand_null_return_1 ();
3369 /* Generate RTL to return from the current function, with value VAL. */
3371 static void
3372 expand_value_return (rtx val)
3374 /* Copy the value to the return location unless it's already there. */
3376 tree decl = DECL_RESULT (current_function_decl);
3377 rtx return_reg = DECL_RTL (decl);
3378 if (return_reg != val)
3380 tree funtype = TREE_TYPE (current_function_decl);
3381 tree type = TREE_TYPE (decl);
3382 int unsignedp = TYPE_UNSIGNED (type);
3383 machine_mode old_mode = DECL_MODE (decl);
3384 machine_mode mode;
3385 if (DECL_BY_REFERENCE (decl))
3386 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3387 else
3388 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3390 if (mode != old_mode)
3391 val = convert_modes (mode, old_mode, val, unsignedp);
3393 if (GET_CODE (return_reg) == PARALLEL)
3394 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3395 else
3396 emit_move_insn (return_reg, val);
3399 expand_null_return_1 ();
3402 /* Generate RTL to evaluate the expression RETVAL and return it
3403 from the current function. */
/* RETVAL may be error_mark_node, a MODIFY_EXPR or INIT_EXPR whose
   destination is a RESULT_DECL (only its right-hand side is then treated
   as the returned value), or any other expression.

   BOUNDS is consulted only when the function's RESULT_DECL has
   DECL_BOUNDS_RTL set: a usable BOUNDS tree is expanded and stored with
   targetm.calls.store_returned_bounds; otherwise zero bounds or bounds
   loaded from the address of the returned value are stored instead.

   Every path ends in expand_null_return or expand_value_return.  */
3405 static void
3406 expand_return (tree retval, tree bounds)
3408 rtx result_rtl;
3409 rtx val = 0;
3410 tree retval_rhs;
3411 rtx bounds_rtl;
3413 /* If function wants no value, give it none. */
3414 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
/* RETVAL is still expanded, but its value is not used.  */
3416 expand_normal (retval);
3417 expand_null_return ();
3418 return;
3421 if (retval == error_mark_node)
3423 /* Treat this like a return of no value from a function that
3424 returns a value. */
3425 expand_null_return ();
3426 return;
/* Strip an assignment to the RESULT_DECL so that RETVAL_RHS names the
   value being returned.  */
3428 else if ((TREE_CODE (retval) == MODIFY_EXPR
3429 || TREE_CODE (retval) == INIT_EXPR)
3430 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3431 retval_rhs = TREE_OPERAND (retval, 1);
3432 else
3433 retval_rhs = retval;
3435 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3437 /* Put returned bounds to the right place. */
3438 bounds_rtl = DECL_BOUNDS_RTL (DECL_RESULT (current_function_decl));
3439 if (bounds_rtl)
3441 rtx addr = NULL;
3442 rtx bnd = NULL;
/* Case 1: real bounds were supplied; expand and store them directly.  */
3444 if (bounds && bounds != error_mark_node)
3446 bnd = expand_normal (bounds);
3447 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Case 2: the bounds live in a single register.  A non-null BOUNDS here
   can only be error_mark_node, for which zero bounds are used; with no
   BOUNDS at all they are loaded from the address of RETVAL_RHS.  */
3449 else if (REG_P (bounds_rtl))
3451 if (bounds)
3452 bnd = chkp_expand_zero_bounds ();
3453 else
3455 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3456 addr = gen_rtx_MEM (Pmode, addr);
3457 bnd = targetm.calls.load_bounds_for_arg (addr, NULL, NULL);
3460 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Case 3: the bounds are spread over a PARALLEL; each element is stored
   separately.  */
3462 else
3464 int n;
3466 gcc_assert (GET_CODE (bounds_rtl) == PARALLEL);
3468 if (bounds)
3469 bnd = chkp_expand_zero_bounds ();
3470 else
3472 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3473 addr = gen_rtx_MEM (Pmode, addr);
3476 for (n = 0; n < XVECLEN (bounds_rtl, 0); n++)
/* Operand 0 of each PARALLEL element is the slot to store into; operand
   1 is used below as a constant offset from ADDR.  */
3478 rtx slot = XEXP (XVECEXP (bounds_rtl, 0, n), 0);
3479 if (!bounds)
3481 rtx offs = XEXP (XVECEXP (bounds_rtl, 0, n), 1);
3482 rtx from = adjust_address (addr, Pmode, INTVAL (offs));
3483 bnd = targetm.calls.load_bounds_for_arg (from, NULL, NULL);
3485 targetm.calls.store_returned_bounds (slot, bnd);
/* NOTE(review): block delimiters are not visible in this copy; this
   `else if' presumably pairs with the `if (bounds_rtl)' test above,
   i.e. it handles an instrumented function with no bounds RTL -- confirm.  */
3489 else if (chkp_function_instrumented_p (current_function_decl)
3490 && !BOUNDED_P (retval_rhs)
3491 && chkp_type_has_pointer (TREE_TYPE (retval_rhs))
3492 && TREE_CODE (retval_rhs) != RESULT_DECL)
3494 rtx addr = expand_normal (build_fold_addr_expr (retval_rhs));
3495 addr = gen_rtx_MEM (Pmode, addr);
3497 gcc_assert (MEM_P (result_rtl));
3499 chkp_copy_bounds_for_stack_parm (result_rtl, addr, TREE_TYPE (retval_rhs));
3502 /* If we are returning the RESULT_DECL, then the value has already
3503 been stored into it, so we don't have to do anything special. */
3504 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3505 expand_value_return (result_rtl);
3507 /* If the result is an aggregate that is being returned in one (or more)
3508 registers, load the registers here. */
3510 else if (retval_rhs != 0
3511 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3512 && REG_P (result_rtl))
3514 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
/* A null result from copy_blkmode_to_reg is handled as a return with no
   value.  */
3515 if (val)
3517 /* Use the mode of the result value on the return register. */
3518 PUT_MODE (result_rtl, GET_MODE (val));
3519 expand_value_return (val);
3521 else
3522 expand_null_return ();
3524 else if (retval_rhs != 0
3525 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3526 && (REG_P (result_rtl)
3527 || (GET_CODE (result_rtl) == PARALLEL)))
3529 /* Compute the return value into a temporary (usually a pseudo reg). */
/* NOTE(review): the left-hand side of the assignment below is not
   visible in this copy; the next statement reads VAL, so it is
   presumably VAL -- confirm.  */
3531 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3532 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3533 val = force_not_mem (val);
3534 expand_value_return (val);
3536 else
3538 /* No hard reg used; calculate value into hard return reg. */
/* The whole RETVAL (not just RETVAL_RHS) is expanded with const0_rtx as
   target, and RESULT_RTL is then returned as the value.  */
3539 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3540 expand_value_return (result_rtl);
3544 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3545 STMT that doesn't require special handling for outgoing edges. That
3546 is no tailcalls and no GIMPLE_COND. */
/* The current insn location is set from STMT first, then the statement
   is dispatched on its gimple code.  Codes not listed in the switch hit
   gcc_unreachable.  */
3548 static void
3549 expand_gimple_stmt_1 (gimple *stmt)
3551 tree op0;
3553 set_curr_insn_location (gimple_location (stmt));
3555 switch (gimple_code (stmt))
/* A goto whose destination is a LABEL_DECL is a direct jump; any other
   destination is expanded as a computed goto.  */
3557 case GIMPLE_GOTO:
3558 op0 = gimple_goto_dest (stmt);
3559 if (TREE_CODE (op0) == LABEL_DECL)
3560 expand_goto (op0);
3561 else
3562 expand_computed_goto (op0);
3563 break;
3564 case GIMPLE_LABEL:
3565 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3566 break;
/* Nops and predictions generate no RTL.  */
3567 case GIMPLE_NOP:
3568 case GIMPLE_PREDICT:
3569 break;
/* A switch with a single label (the default) is just a jump to that
   label; anything else goes through expand_case.  */
3570 case GIMPLE_SWITCH:
3572 gswitch *swtch = as_a <gswitch *> (stmt);
3573 if (gimple_switch_num_labels (swtch) == 1)
3574 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3575 else
3576 expand_case (swtch);
3578 break;
3579 case GIMPLE_ASM:
3580 expand_asm_stmt (as_a <gasm *> (stmt));
3581 break;
3582 case GIMPLE_CALL:
3583 expand_call_stmt (as_a <gcall *> (stmt));
3584 break;
/* Returns: a missing return value becomes expand_null_return; otherwise
   the value (wrapped in an assignment to the RESULT_DECL when it is not
   the RESULT_DECL itself) is handed to expand_return together with the
   return bounds.  */
3586 case GIMPLE_RETURN:
3588 tree bnd = gimple_return_retbnd (as_a <greturn *> (stmt));
3589 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3591 if (op0 && op0 != error_mark_node)
3593 tree result = DECL_RESULT (current_function_decl);
3595 /* Mark we have return statement with missing bounds. */
3596 if (!bnd
3597 && chkp_function_instrumented_p (cfun->decl)
3598 && !DECL_P (op0))
3599 bnd = error_mark_node;
3601 /* If we are not returning the current function's RESULT_DECL,
3602 build an assignment to it. */
3603 if (op0 != result)
3605 /* I believe that a function's RESULT_DECL is unique. */
3606 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3608 /* ??? We'd like to use simply expand_assignment here,
3609 but this fails if the value is of BLKmode but the return
3610 decl is a register. expand_return has special handling
3611 for this combination, which eventually should move
3612 to common code. See comments there. Until then, let's
3613 build a modify expression :-/ */
3614 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3615 result, op0);
3619 if (!op0)
3620 expand_null_return ();
3621 else
3622 expand_return (op0, bnd);
3624 break;
/* Assignments come in two shapes: a single-operand right-hand side (or
   any store to a non-SSA_NAME destination), handled by
   expand_assignment, and unary/binary/ternary operations into an
   SSA_NAME, which are expanded through expand_expr_real_2.  */
3626 case GIMPLE_ASSIGN:
3628 gassign *assign_stmt = as_a <gassign *> (stmt);
3629 tree lhs = gimple_assign_lhs (assign_stmt);
3631 /* Tree expand used to fiddle with |= and &= of two bitfield
3632 COMPONENT_REFs here. This can't happen with gimple, the LHS
3633 of binary assigns must be a gimple reg. */
3635 if (TREE_CODE (lhs) != SSA_NAME
3636 || get_gimple_rhs_class (gimple_expr_code (stmt))
3637 == GIMPLE_SINGLE_RHS)
3639 tree rhs = gimple_assign_rhs1 (assign_stmt);
/* Even when this branch was entered because LHS is not an SSA_NAME, the
   right-hand side is required to be a single operand.  */
3640 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3641 == GIMPLE_SINGLE_RHS);
3642 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3643 /* Do not put locations on possibly shared trees. */
3644 && !is_gimple_min_invariant (rhs))
3645 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
/* NOTE(review): no statement is visible for the clobber branch in this
   copy; presumably it is an empty statement, i.e. clobbers emit no
   code -- confirm.  */
3646 if (TREE_CLOBBER_P (rhs))
3647 /* This is a clobber to mark the going out of scope for
3648 this LHS. */
3650 else
3651 expand_assignment (lhs, rhs,
3652 gimple_assign_nontemporal_move_p (
3653 assign_stmt));
3655 else
3657 rtx target, temp;
3658 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3659 struct separate_ops ops;
3660 bool promoted = false;
3662 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
/* Remember whether the destination is a SUBREG marked as a promoted
   variable; such a destination is written through its inner register
   further down.  */
3663 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3664 promoted = true;
3666 ops.code = gimple_assign_rhs_code (assign_stmt);
3667 ops.type = TREE_TYPE (lhs);
/* Fill in as many operands as the operation class has; the cases fall
   through from ternary down to unary.  */
3668 switch (get_gimple_rhs_class (ops.code))
3670 case GIMPLE_TERNARY_RHS:
3671 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3672 /* Fallthru */
3673 case GIMPLE_BINARY_RHS:
3674 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3675 /* Fallthru */
3676 case GIMPLE_UNARY_RHS:
3677 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3678 break;
3679 default:
3680 gcc_unreachable ();
3682 ops.location = gimple_location (stmt);
3684 /* If we want to use a nontemporal store, force the value to
3685 register first. If we store into a promoted register,
3686 don't directly expand to target. */
3687 temp = nontemporal || promoted ? NULL_RTX : target;
3688 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3689 EXPAND_NORMAL);
/* NOTE(review): the statements for the `temp == target' branch here and
   for the successful emit_storent_insn branch below are not visible in
   this copy; presumably both are empty statements (nothing left to
   do) -- confirm.  */
3691 if (temp == target)
3693 else if (promoted)
3695 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3696 /* If TEMP is a VOIDmode constant, use convert_modes to make
3697 sure that we properly convert it. */
3698 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3700 temp = convert_modes (GET_MODE (target),
3701 TYPE_MODE (ops.type),
3702 temp, unsignedp);
3703 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3704 GET_MODE (target), temp, unsignedp);
3707 convert_move (SUBREG_REG (target), temp, unsignedp);
3709 else if (nontemporal && emit_storent_insn (target, temp))
3711 else
/* Ordinary case: make TEMP a valid operand and move it into TARGET
   unless force_operand already placed it there.  */
3713 temp = force_operand (temp, target);
3714 if (temp != target)
3715 emit_move_insn (target, temp);
3719 break;
3721 default:
3722 gcc_unreachable ();
3726 /* Expand one gimple statement STMT and return the last RTL instruction
3727 before any of the newly generated ones.
3729 In addition to generating the necessary RTL instructions this also
3730 sets REG_EH_REGION notes if necessary and sets the current source
3731 location for diagnostics. */
3733 static rtx_insn *
3734 expand_gimple_stmt (gimple *stmt)
3736 location_t saved_location = input_location;
3737 rtx_insn *last = get_last_insn ();
3738 int lp_nr;
3740 gcc_assert (cfun);
3742 /* We need to save and restore the current source location so that errors
3743 discovered during expansion are emitted with the right location. But
3744 it would be better if the diagnostic routines used the source location
3745 embedded in the tree nodes rather than globals. */
3746 if (gimple_has_location (stmt))
3747 input_location = gimple_location (stmt);
3749 expand_gimple_stmt_1 (stmt);
3751 /* Free any temporaries used to evaluate this statement. */
3752 free_temp_slots ();
3754 input_location = saved_location;
3756 /* Mark all insns that may trap. */
3757 lp_nr = lookup_stmt_eh_lp (stmt);
3758 if (lp_nr)
3760 rtx_insn *insn;
3761 for (insn = next_real_insn (last); insn;
3762 insn = next_real_insn (insn))
3764 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3765 /* If we want exceptions for non-call insns, any
3766 may_trap_p instruction may throw. */
3767 && GET_CODE (PATTERN (insn)) != CLOBBER
3768 && GET_CODE (PATTERN (insn)) != USE
3769 && insn_could_throw_p (insn))
3770 make_reg_eh_region_note (insn, 0, lp_nr);
3774 return last;
3777 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3778 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3779 generated a tail call (something that might be denied by the ABI
3780 rules governing the call; see calls.c).
3782 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3783 can still reach the rest of BB. The case here is __builtin_sqrt,
3784 where the NaN result goes through the external function (with a
3785 tailcall) and the normal result happens via a sqrt instruction. */
/* BB is the block containing STMT.  When no sibling call insn was
   emitted, *CAN_FALLTHRU is set to true and NULL is returned.  Otherwise
   the return value is BB itself or, when insns remain after the sibcall
   barrier, a new basic block created for them.  */
3787 static basic_block
3788 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3790 rtx_insn *last2, *last;
3791 edge e;
3792 edge_iterator ei;
3793 profile_probability probability;
/* LAST2 keeps the insn preceding the expansion for the dump calls; LAST
   is used as a cursor from here on.  */
3795 last2 = last = expand_gimple_stmt (stmt);
/* Search the insns generated for STMT for a call marked as a sibling
   call.  */
3797 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3798 if (CALL_P (last) && SIBLING_CALL_P (last))
3799 goto found;
/* No sibling call was emitted, so this was expanded as a normal call.  */
3801 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3803 *can_fallthru = true;
3804 return NULL;
3806 found:
3807 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3808 Any instructions emitted here are about to be deleted. */
3809 do_pending_stack_adjust ();
3811 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3812 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3813 EH or abnormal edges, we shouldn't have created a tail call in
3814 the first place. So it seems to me we should just be removing
3815 all edges here, or redirecting the existing fallthru edge to
3816 the exit block. */
/* PROBABILITY and COUNT accumulate the profile data of the edges removed
   below; they are later assigned to the new sibcall edge.  */
3818 probability = profile_probability::never ();
3819 profile_count count = profile_count::zero ();
/* The iterator is advanced only when an edge is kept, because
   remove_edge takes the current edge out of the successor list.  */
3821 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3823 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3825 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
/* Take the removed edge's contribution out of the destination block's
   profile, clamping the frequency at zero.  */
3827 e->dest->count -= e->count;
3828 e->dest->frequency -= EDGE_FREQUENCY (e);
3829 if (e->dest->frequency < 0)
3830 e->dest->frequency = 0;
3832 count += e->count;
3833 probability += e->probability;
3834 remove_edge (e);
3836 else
3837 ei_next (&ei);
3840 /* This is somewhat ugly: the call_expr expander often emits instructions
3841 after the sibcall (to perform the function return). These confuse the
3842 find_many_sub_basic_blocks code, so we need to get rid of these. */
/* The insn right after the sibling call must be a barrier; everything
   after that barrier is deleted until a label (if any) is reached.  */
3843 last = NEXT_INSN (last);
3844 gcc_assert (BARRIER_P (last));
3846 *can_fallthru = false;
3847 while (NEXT_INSN (last))
3849 /* For instance an sqrt builtin expander expands if with
3850 sibcall in the then and label for `else`. */
3851 if (LABEL_P (NEXT_INSN (last)))
3853 *can_fallthru = true;
3854 break;
3856 delete_insn (NEXT_INSN (last));
/* Add the abnormal sibcall edge to the exit block and give it the
   profile data collected from the removed edges.  */
3859 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3860 | EDGE_SIBCALL);
3861 e->probability = probability;
3862 e->count = count;
3863 BB_END (bb) = last;
3864 update_bb_for_insn (bb);
/* Insns remain only when the deletion loop stopped at a label; they go
   into a new basic block, which becomes the return value.  A trailing
   barrier is kept out of that block.  */
3866 if (NEXT_INSN (last))
3868 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3870 last = BB_END (bb);
3871 if (BARRIER_P (last))
3872 BB_END (bb) = PREV_INSN (last);
3875 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3877 return bb;
3880 /* Return the difference between the floor and the truncated result of
3881 a signed division by OP1 with remainder MOD. */
3882 static rtx
3883 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3885 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3886 return gen_rtx_IF_THEN_ELSE
3887 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3888 gen_rtx_IF_THEN_ELSE
3889 (mode, gen_rtx_LT (BImode,
3890 gen_rtx_DIV (mode, op1, mod),
3891 const0_rtx),
3892 constm1_rtx, const0_rtx),
3893 const0_rtx);
3896 /* Return the difference between the ceil and the truncated result of
3897 a signed division by OP1 with remainder MOD. */
3898 static rtx
3899 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3901 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3902 return gen_rtx_IF_THEN_ELSE
3903 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3904 gen_rtx_IF_THEN_ELSE
3905 (mode, gen_rtx_GT (BImode,
3906 gen_rtx_DIV (mode, op1, mod),
3907 const0_rtx),
3908 const1_rtx, const0_rtx),
3909 const0_rtx);
3912 /* Return the difference between the ceil and the truncated result of
3913 an unsigned division by OP1 with remainder MOD. */
3914 static rtx
3915 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3917 /* (mod != 0 ? 1 : 0) */
3918 return gen_rtx_IF_THEN_ELSE
3919 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3920 const1_rtx, const0_rtx);
3923 /* Return the difference between the rounded and the truncated result
3924 of a signed division by OP1 with remainder MOD. Halfway cases are
3925 rounded away from zero, rather than to the nearest even number. */
3926 static rtx
3927 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3929 /* (abs (mod) >= abs (op1) - abs (mod)
3930 ? (op1 / mod > 0 ? 1 : -1)
3931 : 0) */
3932 return gen_rtx_IF_THEN_ELSE
3933 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3934 gen_rtx_MINUS (mode,
3935 gen_rtx_ABS (mode, op1),
3936 gen_rtx_ABS (mode, mod))),
3937 gen_rtx_IF_THEN_ELSE
3938 (mode, gen_rtx_GT (BImode,
3939 gen_rtx_DIV (mode, op1, mod),
3940 const0_rtx),
3941 const1_rtx, constm1_rtx),
3942 const0_rtx);
3945 /* Return the difference between the rounded and the truncated result
3946 of a unsigned division by OP1 with remainder MOD. Halfway cases
3947 are rounded away from zero, rather than to the nearest even
3948 number. */
3949 static rtx
3950 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
3952 /* (mod >= op1 - mod ? 1 : 0) */
3953 return gen_rtx_IF_THEN_ELSE
3954 (mode, gen_rtx_GE (BImode, mod,
3955 gen_rtx_MINUS (mode, op1, mod)),
3956 const1_rtx, const0_rtx);
3959 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3960 any rtl. */
/* AS is the address space the address belongs to.  Returns the converted
   address, X itself when no conversion is needed, or NULL when the
   conversion cannot be expressed.  The body depends on whether the
   target defines POINTERS_EXTEND_UNSIGNED.  */
3962 static rtx
3963 convert_debug_memory_address (machine_mode mode, rtx x,
3964 addr_space_t as)
3966 machine_mode xmode = GET_MODE (x);
/* Without POINTERS_EXTEND_UNSIGNED nothing is converted: the modes are
   only checked and X is returned unchanged at the end.  */
3968 #ifndef POINTERS_EXTEND_UNSIGNED
3969 gcc_assert (mode == Pmode
3970 || mode == targetm.addr_space.address_mode (as));
3971 gcc_assert (xmode == mode || xmode == VOIDmode);
3972 #else
3973 rtx temp;
3975 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
/* X already has the requested mode, or has no mode at all.  */
3977 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3978 return x;
/* Narrowing takes the low part.  Widening uses a zero or sign extension
   when POINTERS_EXTEND_UNSIGNED is positive or zero respectively; for a
   negative value the cases below are tried instead.  */
3980 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3981 x = lowpart_subreg (mode, x, xmode);
3982 else if (POINTERS_EXTEND_UNSIGNED > 0)
3983 x = gen_rtx_ZERO_EXTEND (mode, x);
3984 else if (!POINTERS_EXTEND_UNSIGNED)
3985 x = gen_rtx_SIGN_EXTEND (mode, x);
3986 else
3988 switch (GET_CODE (x))
/* A SUBREG whose inner expression already has MODE and is a promoted
   variable, a pointer register, or a pointer register plus a constant
   can be replaced by that inner expression.  */
3990 case SUBREG:
3991 if ((SUBREG_PROMOTED_VAR_P (x)
3992 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3993 || (GET_CODE (SUBREG_REG (x)) == PLUS
3994 && REG_P (XEXP (SUBREG_REG (x), 0))
3995 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
3996 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
3997 && GET_MODE (SUBREG_REG (x)) == mode)
3998 return SUBREG_REG (x);
3999 break;
/* Label and symbol references are rebuilt or copied with the new mode.  */
4000 case LABEL_REF:
4001 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4002 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4003 return temp;
4004 case SYMBOL_REF:
4005 temp = shallow_copy_rtx (x);
4006 PUT_MODE (temp, mode);
4007 return temp;
/* CONST, and PLUS/MINUS with a constant second operand, are handled by
   converting the first operand recursively; a failed inner conversion
   propagates as NULL.  */
4008 case CONST:
4009 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4010 if (temp)
4011 temp = gen_rtx_CONST (mode, temp);
4012 return temp;
4013 case PLUS:
4014 case MINUS:
4015 if (CONST_INT_P (XEXP (x, 1)))
4017 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4018 if (temp)
4019 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4021 break;
4022 default:
4023 break;
4025 /* Don't know how to express ptr_extend as operation in debug info. */
4026 return NULL;
4028 #endif /* POINTERS_EXTEND_UNSIGNED */
4030 return x;
4033 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4034 by avoid_deep_ter_for_debug. */
4036 static hash_map<tree, tree> *deep_ter_debug_map;
4038 /* Split too deep TER chains for debug stmts using debug temporaries. */
4040 static void
4041 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4043 use_operand_p use_p;
4044 ssa_op_iter iter;
4045 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4047 tree use = USE_FROM_PTR (use_p);
4048 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4049 continue;
4050 gimple *g = get_gimple_for_ssa_name (use);
4051 if (g == NULL)
4052 continue;
4053 if (depth > 6 && !stmt_ends_bb_p (g))
4055 if (deep_ter_debug_map == NULL)
4056 deep_ter_debug_map = new hash_map<tree, tree>;
4058 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4059 if (vexpr != NULL)
4060 continue;
4061 vexpr = make_node (DEBUG_EXPR_DECL);
4062 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4063 DECL_ARTIFICIAL (vexpr) = 1;
4064 TREE_TYPE (vexpr) = TREE_TYPE (use);
4065 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4066 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4067 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4068 avoid_deep_ter_for_debug (def_temp, 0);
4070 else
4071 avoid_deep_ter_for_debug (g, depth + 1);
4075 /* Return an RTX equivalent to the value of the parameter DECL. */
4077 static rtx
4078 expand_debug_parm_decl (tree decl)
4080 rtx incoming = DECL_INCOMING_RTL (decl);
4082 if (incoming
4083 && GET_MODE (incoming) != BLKmode
4084 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4085 || (MEM_P (incoming)
4086 && REG_P (XEXP (incoming, 0))
4087 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4089 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4091 #ifdef HAVE_window_save
4092 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4093 If the target machine has an explicit window save instruction, the
4094 actual entry value is the corresponding OUTGOING_REGNO instead. */
4095 if (REG_P (incoming)
4096 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4097 incoming
4098 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4099 OUTGOING_REGNO (REGNO (incoming)), 0);
4100 else if (MEM_P (incoming))
4102 rtx reg = XEXP (incoming, 0);
4103 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4105 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4106 incoming = replace_equiv_address_nv (incoming, reg);
4108 else
4109 incoming = copy_rtx (incoming);
4111 #endif
4113 ENTRY_VALUE_EXP (rtl) = incoming;
4114 return rtl;
4117 if (incoming
4118 && GET_MODE (incoming) != BLKmode
4119 && !TREE_ADDRESSABLE (decl)
4120 && MEM_P (incoming)
4121 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4122 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4123 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4124 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4125 return copy_rtx (incoming);
4127 return NULL_RTX;
4130 /* Return an RTX equivalent to the value of the tree expression EXP. */
4132 static rtx
4133 expand_debug_expr (tree exp)
4135 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4136 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4137 machine_mode inner_mode = VOIDmode;
4138 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4139 addr_space_t as;
4141 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4143 case tcc_expression:
4144 switch (TREE_CODE (exp))
4146 case COND_EXPR:
4147 case DOT_PROD_EXPR:
4148 case SAD_EXPR:
4149 case WIDEN_MULT_PLUS_EXPR:
4150 case WIDEN_MULT_MINUS_EXPR:
4151 case FMA_EXPR:
4152 goto ternary;
4154 case TRUTH_ANDIF_EXPR:
4155 case TRUTH_ORIF_EXPR:
4156 case TRUTH_AND_EXPR:
4157 case TRUTH_OR_EXPR:
4158 case TRUTH_XOR_EXPR:
4159 goto binary;
4161 case TRUTH_NOT_EXPR:
4162 goto unary;
4164 default:
4165 break;
4167 break;
4169 ternary:
4170 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4171 if (!op2)
4172 return NULL_RTX;
4173 /* Fall through. */
4175 binary:
4176 case tcc_binary:
4177 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4178 if (!op1)
4179 return NULL_RTX;
4180 switch (TREE_CODE (exp))
4182 case LSHIFT_EXPR:
4183 case RSHIFT_EXPR:
4184 case LROTATE_EXPR:
4185 case RROTATE_EXPR:
4186 case WIDEN_LSHIFT_EXPR:
4187 /* Ensure second operand isn't wider than the first one. */
4188 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4189 if (SCALAR_INT_MODE_P (inner_mode))
4191 machine_mode opmode = mode;
4192 if (VECTOR_MODE_P (mode))
4193 opmode = GET_MODE_INNER (mode);
4194 if (SCALAR_INT_MODE_P (opmode)
4195 && (GET_MODE_PRECISION (opmode)
4196 < GET_MODE_PRECISION (inner_mode)))
4197 op1 = lowpart_subreg (opmode, op1, inner_mode);
4199 break;
4200 default:
4201 break;
4203 /* Fall through. */
4205 unary:
4206 case tcc_unary:
4207 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4208 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4209 if (!op0)
4210 return NULL_RTX;
4211 break;
4213 case tcc_comparison:
4214 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4215 goto binary;
4217 case tcc_type:
4218 case tcc_statement:
4219 gcc_unreachable ();
4221 case tcc_constant:
4222 case tcc_exceptional:
4223 case tcc_declaration:
4224 case tcc_reference:
4225 case tcc_vl_exp:
4226 break;
4229 switch (TREE_CODE (exp))
4231 case STRING_CST:
4232 if (!lookup_constant_def (exp))
4234 if (strlen (TREE_STRING_POINTER (exp)) + 1
4235 != (size_t) TREE_STRING_LENGTH (exp))
4236 return NULL_RTX;
4237 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4238 op0 = gen_rtx_MEM (BLKmode, op0);
4239 set_mem_attributes (op0, exp, 0);
4240 return op0;
4242 /* Fall through. */
4244 case INTEGER_CST:
4245 case REAL_CST:
4246 case FIXED_CST:
4247 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4248 return op0;
4250 case COMPLEX_CST:
4251 gcc_assert (COMPLEX_MODE_P (mode));
4252 op0 = expand_debug_expr (TREE_REALPART (exp));
4253 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4254 return gen_rtx_CONCAT (mode, op0, op1);
4256 case DEBUG_EXPR_DECL:
4257 op0 = DECL_RTL_IF_SET (exp);
4259 if (op0)
4260 return op0;
4262 op0 = gen_rtx_DEBUG_EXPR (mode);
4263 DEBUG_EXPR_TREE_DECL (op0) = exp;
4264 SET_DECL_RTL (exp, op0);
4266 return op0;
4268 case VAR_DECL:
4269 case PARM_DECL:
4270 case FUNCTION_DECL:
4271 case LABEL_DECL:
4272 case CONST_DECL:
4273 case RESULT_DECL:
4274 op0 = DECL_RTL_IF_SET (exp);
4276 /* This decl was probably optimized away. */
4277 if (!op0)
4279 if (!VAR_P (exp)
4280 || DECL_EXTERNAL (exp)
4281 || !TREE_STATIC (exp)
4282 || !DECL_NAME (exp)
4283 || DECL_HARD_REGISTER (exp)
4284 || DECL_IN_CONSTANT_POOL (exp)
4285 || mode == VOIDmode)
4286 return NULL;
4288 op0 = make_decl_rtl_for_debug (exp);
4289 if (!MEM_P (op0)
4290 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4291 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4292 return NULL;
4294 else
4295 op0 = copy_rtx (op0);
4297 if (GET_MODE (op0) == BLKmode
4298 /* If op0 is not BLKmode, but mode is, adjust_mode
4299 below would ICE. While it is likely a FE bug,
4300 try to be robust here. See PR43166. */
4301 || mode == BLKmode
4302 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4304 gcc_assert (MEM_P (op0));
4305 op0 = adjust_address_nv (op0, mode, 0);
4306 return op0;
4309 /* Fall through. */
4311 adjust_mode:
4312 case PAREN_EXPR:
4313 CASE_CONVERT:
4315 inner_mode = GET_MODE (op0);
4317 if (mode == inner_mode)
4318 return op0;
4320 if (inner_mode == VOIDmode)
4322 if (TREE_CODE (exp) == SSA_NAME)
4323 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4324 else
4325 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4326 if (mode == inner_mode)
4327 return op0;
4330 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4332 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
4333 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4334 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
4335 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4336 else
4337 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4339 else if (FLOAT_MODE_P (mode))
4341 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4342 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4343 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4344 else
4345 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4347 else if (FLOAT_MODE_P (inner_mode))
4349 if (unsignedp)
4350 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4351 else
4352 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4354 else if (CONSTANT_P (op0)
4355 || GET_MODE_PRECISION (mode) <= GET_MODE_PRECISION (inner_mode))
4356 op0 = lowpart_subreg (mode, op0, inner_mode);
4357 else if (UNARY_CLASS_P (exp)
4358 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4359 : unsignedp)
4360 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4361 else
4362 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4364 return op0;
4367 case MEM_REF:
4368 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4370 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4371 TREE_OPERAND (exp, 0),
4372 TREE_OPERAND (exp, 1));
4373 if (newexp)
4374 return expand_debug_expr (newexp);
4376 /* FALLTHROUGH */
4377 case INDIRECT_REF:
4378 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4379 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4380 if (!op0)
4381 return NULL;
4383 if (TREE_CODE (exp) == MEM_REF)
4385 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4386 || (GET_CODE (op0) == PLUS
4387 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4388 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4389 Instead just use get_inner_reference. */
4390 goto component_ref;
4392 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4393 if (!op1 || !CONST_INT_P (op1))
4394 return NULL;
4396 op0 = plus_constant (inner_mode, op0, INTVAL (op1));
4399 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4401 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4402 op0, as);
4403 if (op0 == NULL_RTX)
4404 return NULL;
4406 op0 = gen_rtx_MEM (mode, op0);
4407 set_mem_attributes (op0, exp, 0);
4408 if (TREE_CODE (exp) == MEM_REF
4409 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4410 set_mem_expr (op0, NULL_TREE);
4411 set_mem_addr_space (op0, as);
4413 return op0;
4415 case TARGET_MEM_REF:
4416 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4417 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4418 return NULL;
4420 op0 = expand_debug_expr
4421 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4422 if (!op0)
4423 return NULL;
4425 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4426 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4427 op0, as);
4428 if (op0 == NULL_RTX)
4429 return NULL;
4431 op0 = gen_rtx_MEM (mode, op0);
4433 set_mem_attributes (op0, exp, 0);
4434 set_mem_addr_space (op0, as);
4436 return op0;
4438 component_ref:
4439 case ARRAY_REF:
4440 case ARRAY_RANGE_REF:
4441 case COMPONENT_REF:
4442 case BIT_FIELD_REF:
4443 case REALPART_EXPR:
4444 case IMAGPART_EXPR:
4445 case VIEW_CONVERT_EXPR:
4447 machine_mode mode1;
4448 HOST_WIDE_INT bitsize, bitpos;
4449 tree offset;
4450 int reversep, volatilep = 0;
4451 tree tem
4452 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4453 &unsignedp, &reversep, &volatilep);
4454 rtx orig_op0;
4456 if (bitsize == 0)
4457 return NULL;
4459 orig_op0 = op0 = expand_debug_expr (tem);
4461 if (!op0)
4462 return NULL;
4464 if (offset)
4466 machine_mode addrmode, offmode;
4468 if (!MEM_P (op0))
4469 return NULL;
4471 op0 = XEXP (op0, 0);
4472 addrmode = GET_MODE (op0);
4473 if (addrmode == VOIDmode)
4474 addrmode = Pmode;
4476 op1 = expand_debug_expr (offset);
4477 if (!op1)
4478 return NULL;
4480 offmode = GET_MODE (op1);
4481 if (offmode == VOIDmode)
4482 offmode = TYPE_MODE (TREE_TYPE (offset));
4484 if (addrmode != offmode)
4485 op1 = lowpart_subreg (addrmode, op1, offmode);
4487 /* Don't use offset_address here, we don't need a
4488 recognizable address, and we don't want to generate
4489 code. */
4490 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4491 op0, op1));
4494 if (MEM_P (op0))
4496 if (mode1 == VOIDmode)
4497 /* Bitfield. */
4498 mode1 = smallest_mode_for_size (bitsize, MODE_INT);
4499 if (bitpos >= BITS_PER_UNIT)
4501 op0 = adjust_address_nv (op0, mode1, bitpos / BITS_PER_UNIT);
4502 bitpos %= BITS_PER_UNIT;
4504 else if (bitpos < 0)
4506 HOST_WIDE_INT units
4507 = (-bitpos + BITS_PER_UNIT - 1) / BITS_PER_UNIT;
4508 op0 = adjust_address_nv (op0, mode1, -units);
4509 bitpos += units * BITS_PER_UNIT;
4511 else if (bitpos == 0 && bitsize == GET_MODE_BITSIZE (mode))
4512 op0 = adjust_address_nv (op0, mode, 0);
4513 else if (GET_MODE (op0) != mode1)
4514 op0 = adjust_address_nv (op0, mode1, 0);
4515 else
4516 op0 = copy_rtx (op0);
4517 if (op0 == orig_op0)
4518 op0 = shallow_copy_rtx (op0);
4519 set_mem_attributes (op0, exp, 0);
4522 if (bitpos == 0 && mode == GET_MODE (op0))
4523 return op0;
4525 if (bitpos < 0)
4526 return NULL;
4528 if (GET_MODE (op0) == BLKmode)
4529 return NULL;
4531 if ((bitpos % BITS_PER_UNIT) == 0
4532 && bitsize == GET_MODE_BITSIZE (mode1))
4534 machine_mode opmode = GET_MODE (op0);
4536 if (opmode == VOIDmode)
4537 opmode = TYPE_MODE (TREE_TYPE (tem));
4539 /* This condition may hold if we're expanding the address
4540 right past the end of an array that turned out not to
4541 be addressable (i.e., the address was only computed in
4542 debug stmts). The gen_subreg below would rightfully
4543 crash, and the address doesn't really exist, so just
4544 drop it. */
4545 if (bitpos >= GET_MODE_BITSIZE (opmode))
4546 return NULL;
4548 if ((bitpos % GET_MODE_BITSIZE (mode)) == 0)
4549 return simplify_gen_subreg (mode, op0, opmode,
4550 bitpos / BITS_PER_UNIT);
4553 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4554 && TYPE_UNSIGNED (TREE_TYPE (exp))
4555 ? SIGN_EXTRACT
4556 : ZERO_EXTRACT, mode,
4557 GET_MODE (op0) != VOIDmode
4558 ? GET_MODE (op0)
4559 : TYPE_MODE (TREE_TYPE (tem)),
4560 op0, GEN_INT (bitsize), GEN_INT (bitpos));
4563 case ABS_EXPR:
4564 return simplify_gen_unary (ABS, mode, op0, mode);
4566 case NEGATE_EXPR:
4567 return simplify_gen_unary (NEG, mode, op0, mode);
4569 case BIT_NOT_EXPR:
4570 return simplify_gen_unary (NOT, mode, op0, mode);
4572 case FLOAT_EXPR:
4573 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4574 0)))
4575 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4576 inner_mode);
4578 case FIX_TRUNC_EXPR:
4579 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4580 inner_mode);
4582 case POINTER_PLUS_EXPR:
4583 /* For the rare target where pointers are not the same size as
4584 size_t, we need to check for mis-matched modes and correct
4585 the addend. */
4586 if (op0 && op1
4587 && GET_MODE (op0) != VOIDmode && GET_MODE (op1) != VOIDmode
4588 && GET_MODE (op0) != GET_MODE (op1))
4590 if (GET_MODE_BITSIZE (GET_MODE (op0)) < GET_MODE_BITSIZE (GET_MODE (op1))
4591 /* If OP0 is a partial mode, then we must truncate, even if it has
4592 the same bitsize as OP1 as GCC's representation of partial modes
4593 is opaque. */
4594 || (GET_MODE_CLASS (GET_MODE (op0)) == MODE_PARTIAL_INT
4595 && GET_MODE_BITSIZE (GET_MODE (op0)) == GET_MODE_BITSIZE (GET_MODE (op1))))
4596 op1 = simplify_gen_unary (TRUNCATE, GET_MODE (op0), op1,
4597 GET_MODE (op1));
4598 else
4599 /* We always sign-extend, regardless of the signedness of
4600 the operand, because the operand is always unsigned
4601 here even if the original C expression is signed. */
4602 op1 = simplify_gen_unary (SIGN_EXTEND, GET_MODE (op0), op1,
4603 GET_MODE (op1));
4605 /* Fall through. */
4606 case PLUS_EXPR:
4607 return simplify_gen_binary (PLUS, mode, op0, op1);
4609 case MINUS_EXPR:
4610 return simplify_gen_binary (MINUS, mode, op0, op1);
4612 case MULT_EXPR:
4613 return simplify_gen_binary (MULT, mode, op0, op1);
4615 case RDIV_EXPR:
4616 case TRUNC_DIV_EXPR:
4617 case EXACT_DIV_EXPR:
4618 if (unsignedp)
4619 return simplify_gen_binary (UDIV, mode, op0, op1);
4620 else
4621 return simplify_gen_binary (DIV, mode, op0, op1);
4623 case TRUNC_MOD_EXPR:
4624 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4626 case FLOOR_DIV_EXPR:
4627 if (unsignedp)
4628 return simplify_gen_binary (UDIV, mode, op0, op1);
4629 else
4631 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4632 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4633 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4634 return simplify_gen_binary (PLUS, mode, div, adj);
4637 case FLOOR_MOD_EXPR:
4638 if (unsignedp)
4639 return simplify_gen_binary (UMOD, mode, op0, op1);
4640 else
4642 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4643 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4644 adj = simplify_gen_unary (NEG, mode,
4645 simplify_gen_binary (MULT, mode, adj, op1),
4646 mode);
4647 return simplify_gen_binary (PLUS, mode, mod, adj);
4650 case CEIL_DIV_EXPR:
4651 if (unsignedp)
4653 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4654 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4655 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4656 return simplify_gen_binary (PLUS, mode, div, adj);
4658 else
4660 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4661 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4662 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4663 return simplify_gen_binary (PLUS, mode, div, adj);
4666 case CEIL_MOD_EXPR:
4667 if (unsignedp)
4669 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4670 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4671 adj = simplify_gen_unary (NEG, mode,
4672 simplify_gen_binary (MULT, mode, adj, op1),
4673 mode);
4674 return simplify_gen_binary (PLUS, mode, mod, adj);
4676 else
4678 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4679 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4680 adj = simplify_gen_unary (NEG, mode,
4681 simplify_gen_binary (MULT, mode, adj, op1),
4682 mode);
4683 return simplify_gen_binary (PLUS, mode, mod, adj);
4686 case ROUND_DIV_EXPR:
4687 if (unsignedp)
4689 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4690 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4691 rtx adj = round_udiv_adjust (mode, mod, op1);
4692 return simplify_gen_binary (PLUS, mode, div, adj);
4694 else
4696 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4697 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4698 rtx adj = round_sdiv_adjust (mode, mod, op1);
4699 return simplify_gen_binary (PLUS, mode, div, adj);
4702 case ROUND_MOD_EXPR:
4703 if (unsignedp)
4705 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4706 rtx adj = round_udiv_adjust (mode, mod, op1);
4707 adj = simplify_gen_unary (NEG, mode,
4708 simplify_gen_binary (MULT, mode, adj, op1),
4709 mode);
4710 return simplify_gen_binary (PLUS, mode, mod, adj);
4712 else
4714 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4715 rtx adj = round_sdiv_adjust (mode, mod, op1);
4716 adj = simplify_gen_unary (NEG, mode,
4717 simplify_gen_binary (MULT, mode, adj, op1),
4718 mode);
4719 return simplify_gen_binary (PLUS, mode, mod, adj);
4722 case LSHIFT_EXPR:
4723 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4725 case RSHIFT_EXPR:
4726 if (unsignedp)
4727 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4728 else
4729 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4731 case LROTATE_EXPR:
4732 return simplify_gen_binary (ROTATE, mode, op0, op1);
4734 case RROTATE_EXPR:
4735 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4737 case MIN_EXPR:
4738 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4740 case MAX_EXPR:
4741 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4743 case BIT_AND_EXPR:
4744 case TRUTH_AND_EXPR:
4745 return simplify_gen_binary (AND, mode, op0, op1);
4747 case BIT_IOR_EXPR:
4748 case TRUTH_OR_EXPR:
4749 return simplify_gen_binary (IOR, mode, op0, op1);
4751 case BIT_XOR_EXPR:
4752 case TRUTH_XOR_EXPR:
4753 return simplify_gen_binary (XOR, mode, op0, op1);
4755 case TRUTH_ANDIF_EXPR:
4756 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4758 case TRUTH_ORIF_EXPR:
4759 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4761 case TRUTH_NOT_EXPR:
4762 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4764 case LT_EXPR:
4765 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4766 op0, op1);
4768 case LE_EXPR:
4769 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4770 op0, op1);
4772 case GT_EXPR:
4773 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4774 op0, op1);
4776 case GE_EXPR:
4777 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4778 op0, op1);
4780 case EQ_EXPR:
4781 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4783 case NE_EXPR:
4784 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4786 case UNORDERED_EXPR:
4787 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4789 case ORDERED_EXPR:
4790 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4792 case UNLT_EXPR:
4793 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4795 case UNLE_EXPR:
4796 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4798 case UNGT_EXPR:
4799 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4801 case UNGE_EXPR:
4802 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4804 case UNEQ_EXPR:
4805 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4807 case LTGT_EXPR:
4808 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4810 case COND_EXPR:
4811 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4813 case COMPLEX_EXPR:
4814 gcc_assert (COMPLEX_MODE_P (mode));
4815 if (GET_MODE (op0) == VOIDmode)
4816 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4817 if (GET_MODE (op1) == VOIDmode)
4818 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4819 return gen_rtx_CONCAT (mode, op0, op1);
4821 case CONJ_EXPR:
4822 if (GET_CODE (op0) == CONCAT)
4823 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4824 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4825 XEXP (op0, 1),
4826 GET_MODE_INNER (mode)));
4827 else
4829 machine_mode imode = GET_MODE_INNER (mode);
4830 rtx re, im;
4832 if (MEM_P (op0))
4834 re = adjust_address_nv (op0, imode, 0);
4835 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4837 else
4839 machine_mode ifmode = int_mode_for_mode (mode);
4840 machine_mode ihmode = int_mode_for_mode (imode);
4841 rtx halfsize;
4842 if (ifmode == BLKmode || ihmode == BLKmode)
4843 return NULL;
4844 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4845 re = op0;
4846 if (mode != ifmode)
4847 re = gen_rtx_SUBREG (ifmode, re, 0);
4848 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4849 if (imode != ihmode)
4850 re = gen_rtx_SUBREG (imode, re, 0);
4851 im = copy_rtx (op0);
4852 if (mode != ifmode)
4853 im = gen_rtx_SUBREG (ifmode, im, 0);
4854 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4855 if (imode != ihmode)
4856 im = gen_rtx_SUBREG (imode, im, 0);
4858 im = gen_rtx_NEG (imode, im);
4859 return gen_rtx_CONCAT (mode, re, im);
4862 case ADDR_EXPR:
4863 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4864 if (!op0 || !MEM_P (op0))
4866 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4867 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4868 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4869 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4870 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4871 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4873 if (handled_component_p (TREE_OPERAND (exp, 0)))
4875 HOST_WIDE_INT bitoffset, bitsize, maxsize;
4876 bool reverse;
4877 tree decl
4878 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
4879 &bitsize, &maxsize, &reverse);
4880 if ((VAR_P (decl)
4881 || TREE_CODE (decl) == PARM_DECL
4882 || TREE_CODE (decl) == RESULT_DECL)
4883 && (!TREE_ADDRESSABLE (decl)
4884 || target_for_debug_bind (decl))
4885 && (bitoffset % BITS_PER_UNIT) == 0
4886 && bitsize > 0
4887 && bitsize == maxsize)
4889 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4890 return plus_constant (mode, base, bitoffset / BITS_PER_UNIT);
4894 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4895 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4896 == ADDR_EXPR)
4898 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4899 0));
4900 if (op0 != NULL
4901 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4902 || (GET_CODE (op0) == PLUS
4903 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4904 && CONST_INT_P (XEXP (op0, 1)))))
4906 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4907 1));
4908 if (!op1 || !CONST_INT_P (op1))
4909 return NULL;
4911 return plus_constant (mode, op0, INTVAL (op1));
4915 return NULL;
4918 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4919 op0 = convert_debug_memory_address (mode, XEXP (op0, 0), as);
4921 return op0;
4923 case VECTOR_CST:
4925 unsigned i;
4927 op0 = gen_rtx_CONCATN
4928 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4930 for (i = 0; i < VECTOR_CST_NELTS (exp); ++i)
4932 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4933 if (!op1)
4934 return NULL;
4935 XVECEXP (op0, 0, i) = op1;
4938 return op0;
4941 case CONSTRUCTOR:
4942 if (TREE_CLOBBER_P (exp))
4943 return NULL;
4944 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4946 unsigned i;
4947 tree val;
4949 op0 = gen_rtx_CONCATN
4950 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4952 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4954 op1 = expand_debug_expr (val);
4955 if (!op1)
4956 return NULL;
4957 XVECEXP (op0, 0, i) = op1;
4960 if (i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)))
4962 op1 = expand_debug_expr
4963 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4965 if (!op1)
4966 return NULL;
4968 for (; i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)); i++)
4969 XVECEXP (op0, 0, i) = op1;
4972 return op0;
4974 else
4975 goto flag_unsupported;
4977 case CALL_EXPR:
4978 /* ??? Maybe handle some builtins? */
4979 return NULL;
4981 case SSA_NAME:
4983 gimple *g = get_gimple_for_ssa_name (exp);
4984 if (g)
4986 tree t = NULL_TREE;
4987 if (deep_ter_debug_map)
4989 tree *slot = deep_ter_debug_map->get (exp);
4990 if (slot)
4991 t = *slot;
4993 if (t == NULL_TREE)
4994 t = gimple_assign_rhs_to_tree (g);
4995 op0 = expand_debug_expr (t);
4996 if (!op0)
4997 return NULL;
4999 else
5001 /* If this is a reference to an incoming value of
5002 parameter that is never used in the code or where the
5003 incoming value is never used in the code, use
5004 PARM_DECL's DECL_RTL if set. */
5005 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5006 && SSA_NAME_VAR (exp)
5007 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5008 && has_zero_uses (exp))
5010 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5011 if (op0)
5012 goto adjust_mode;
5013 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5014 if (op0)
5015 goto adjust_mode;
5018 int part = var_to_partition (SA.map, exp);
5020 if (part == NO_PARTITION)
5021 return NULL;
5023 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5025 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5027 goto adjust_mode;
5030 case ERROR_MARK:
5031 return NULL;
5033 /* Vector stuff. For most of the codes we don't have rtl codes. */
5034 case REALIGN_LOAD_EXPR:
5035 case REDUC_MAX_EXPR:
5036 case REDUC_MIN_EXPR:
5037 case REDUC_PLUS_EXPR:
5038 case VEC_COND_EXPR:
5039 case VEC_PACK_FIX_TRUNC_EXPR:
5040 case VEC_PACK_SAT_EXPR:
5041 case VEC_PACK_TRUNC_EXPR:
5042 case VEC_UNPACK_FLOAT_HI_EXPR:
5043 case VEC_UNPACK_FLOAT_LO_EXPR:
5044 case VEC_UNPACK_HI_EXPR:
5045 case VEC_UNPACK_LO_EXPR:
5046 case VEC_WIDEN_MULT_HI_EXPR:
5047 case VEC_WIDEN_MULT_LO_EXPR:
5048 case VEC_WIDEN_MULT_EVEN_EXPR:
5049 case VEC_WIDEN_MULT_ODD_EXPR:
5050 case VEC_WIDEN_LSHIFT_HI_EXPR:
5051 case VEC_WIDEN_LSHIFT_LO_EXPR:
5052 case VEC_PERM_EXPR:
5053 return NULL;
5055 /* Misc codes. */
5056 case ADDR_SPACE_CONVERT_EXPR:
5057 case FIXED_CONVERT_EXPR:
5058 case OBJ_TYPE_REF:
5059 case WITH_SIZE_EXPR:
5060 case BIT_INSERT_EXPR:
5061 return NULL;
5063 case DOT_PROD_EXPR:
5064 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5065 && SCALAR_INT_MODE_P (mode))
5068 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5069 0)))
5070 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5071 inner_mode);
5073 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5074 1)))
5075 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5076 inner_mode);
5077 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5078 return simplify_gen_binary (PLUS, mode, op0, op2);
5080 return NULL;
5082 case WIDEN_MULT_EXPR:
5083 case WIDEN_MULT_PLUS_EXPR:
5084 case WIDEN_MULT_MINUS_EXPR:
5085 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5086 && SCALAR_INT_MODE_P (mode))
5088 inner_mode = GET_MODE (op0);
5089 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5090 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5091 else
5092 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5093 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5094 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5095 else
5096 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5097 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5098 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5099 return op0;
5100 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5101 return simplify_gen_binary (PLUS, mode, op0, op2);
5102 else
5103 return simplify_gen_binary (MINUS, mode, op2, op0);
5105 return NULL;
5107 case MULT_HIGHPART_EXPR:
5108 /* ??? Similar to the above. */
5109 return NULL;
5111 case WIDEN_SUM_EXPR:
5112 case WIDEN_LSHIFT_EXPR:
5113 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5114 && SCALAR_INT_MODE_P (mode))
5117 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5118 0)))
5119 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5120 inner_mode);
5121 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5122 ? ASHIFT : PLUS, mode, op0, op1);
5124 return NULL;
5126 case FMA_EXPR:
5127 return simplify_gen_ternary (FMA, mode, inner_mode, op0, op1, op2);
5129 default:
5130 flag_unsupported:
5131 if (flag_checking)
5133 debug_tree (exp);
5134 gcc_unreachable ();
5136 return NULL;
5140 /* Return an RTX equivalent to the source bind value of the tree expression
5141 EXP. */
5143 static rtx
5144 expand_debug_source_expr (tree exp)
5146 rtx op0 = NULL_RTX;
5147 machine_mode mode = VOIDmode, inner_mode;
5149 switch (TREE_CODE (exp))
5151 case PARM_DECL:
5153 mode = DECL_MODE (exp);
5154 op0 = expand_debug_parm_decl (exp);
5155 if (op0)
5156 break;
5157 /* See if this isn't an argument that has been completely
5158 optimized out. */
5159 if (!DECL_RTL_SET_P (exp)
5160 && !DECL_INCOMING_RTL (exp)
5161 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5163 tree aexp = DECL_ORIGIN (exp);
5164 if (DECL_CONTEXT (aexp)
5165 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5167 vec<tree, va_gc> **debug_args;
5168 unsigned int ix;
5169 tree ddecl;
5170 debug_args = decl_debug_args_lookup (current_function_decl);
5171 if (debug_args != NULL)
5173 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5174 ix += 2)
5175 if (ddecl == aexp)
5176 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5180 break;
5182 default:
5183 break;
5186 if (op0 == NULL_RTX)
5187 return NULL_RTX;
5189 inner_mode = GET_MODE (op0);
5190 if (mode == inner_mode)
5191 return op0;
5193 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5195 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
5196 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5197 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
5198 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5199 else
5200 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5202 else if (FLOAT_MODE_P (mode))
5203 gcc_unreachable ();
5204 else if (FLOAT_MODE_P (inner_mode))
5206 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5207 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5208 else
5209 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5211 else if (CONSTANT_P (op0)
5212 || GET_MODE_BITSIZE (mode) <= GET_MODE_BITSIZE (inner_mode))
5213 op0 = lowpart_subreg (mode, op0, inner_mode);
5214 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5215 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5216 else
5217 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5219 return op0;
5222 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5223 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5224 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5226 static void
5227 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5229 rtx exp = *exp_p;
5231 if (exp == NULL_RTX)
5232 return;
5234 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5235 return;
5237 if (depth == 4)
5239 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5240 rtx dval = make_debug_expr_from_rtl (exp);
5242 /* Emit a debug bind insn before INSN. */
5243 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5244 DEBUG_EXPR_TREE_DECL (dval), exp,
5245 VAR_INIT_STATUS_INITIALIZED);
5247 emit_debug_insn_before (bind, insn);
5248 *exp_p = dval;
5249 return;
5252 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5253 int i, j;
5254 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5255 switch (*format_ptr++)
5257 case 'e':
5258 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5259 break;
5261 case 'E':
5262 case 'V':
5263 for (j = 0; j < XVECLEN (exp, i); j++)
5264 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5265 break;
5267 default:
5268 break;
5272 /* Expand the _LOCs in debug insns. We run this after expanding all
5273 regular insns, so that any variables referenced in the function
5274 will have their DECL_RTLs set. */
5276 static void
5277 expand_debug_locations (void)
5279 rtx_insn *insn;
5280 rtx_insn *last = get_last_insn ();
5281 int save_strict_alias = flag_strict_aliasing;
5283 /* New alias sets while setting up memory attributes cause
5284 -fcompare-debug failures, even though it doesn't bring about any
5285 codegen changes. */
5286 flag_strict_aliasing = 0;
5288 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5289 if (DEBUG_INSN_P (insn))
5291 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5292 rtx val;
5293 rtx_insn *prev_insn, *insn2;
5294 machine_mode mode;
5296 if (value == NULL_TREE)
5297 val = NULL_RTX;
5298 else
5300 if (INSN_VAR_LOCATION_STATUS (insn)
5301 == VAR_INIT_STATUS_UNINITIALIZED)
5302 val = expand_debug_source_expr (value);
5303 /* The avoid_deep_ter_for_debug function inserts
5304 debug bind stmts after SSA_NAME definition, with the
5305 SSA_NAME as the whole bind location. Disable temporarily
5306 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5307 being defined in this DEBUG_INSN. */
5308 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5310 tree *slot = deep_ter_debug_map->get (value);
5311 if (slot)
5313 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5314 *slot = NULL_TREE;
5315 else
5316 slot = NULL;
5318 val = expand_debug_expr (value);
5319 if (slot)
5320 *slot = INSN_VAR_LOCATION_DECL (insn);
5322 else
5323 val = expand_debug_expr (value);
5324 gcc_assert (last == get_last_insn ());
5327 if (!val)
5328 val = gen_rtx_UNKNOWN_VAR_LOC ();
5329 else
5331 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5333 gcc_assert (mode == GET_MODE (val)
5334 || (GET_MODE (val) == VOIDmode
5335 && (CONST_SCALAR_INT_P (val)
5336 || GET_CODE (val) == CONST_FIXED
5337 || GET_CODE (val) == LABEL_REF)));
5340 INSN_VAR_LOCATION_LOC (insn) = val;
5341 prev_insn = PREV_INSN (insn);
5342 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5343 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5346 flag_strict_aliasing = save_strict_alias;
5349 /* Performs swapping operands of commutative operations to expand
5350 the expensive one first. */
5352 static void
5353 reorder_operands (basic_block bb)
5355 unsigned int *lattice; /* Hold cost of each statement. */
5356 unsigned int i = 0, n = 0;
5357 gimple_stmt_iterator gsi;
5358 gimple_seq stmts;
5359 gimple *stmt;
5360 bool swap;
5361 tree op0, op1;
5362 ssa_op_iter iter;
5363 use_operand_p use_p;
5364 gimple *def0, *def1;
5366 /* Compute cost of each statement using estimate_num_insns. */
5367 stmts = bb_seq (bb);
5368 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5370 stmt = gsi_stmt (gsi);
5371 if (!is_gimple_debug (stmt))
5372 gimple_set_uid (stmt, n++);
5374 lattice = XNEWVEC (unsigned int, n);
5375 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5377 unsigned cost;
5378 stmt = gsi_stmt (gsi);
5379 if (is_gimple_debug (stmt))
5380 continue;
5381 cost = estimate_num_insns (stmt, &eni_size_weights);
5382 lattice[i] = cost;
5383 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5385 tree use = USE_FROM_PTR (use_p);
5386 gimple *def_stmt;
5387 if (TREE_CODE (use) != SSA_NAME)
5388 continue;
5389 def_stmt = get_gimple_for_ssa_name (use);
5390 if (!def_stmt)
5391 continue;
5392 lattice[i] += lattice[gimple_uid (def_stmt)];
5394 i++;
5395 if (!is_gimple_assign (stmt)
5396 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5397 continue;
5398 op0 = gimple_op (stmt, 1);
5399 op1 = gimple_op (stmt, 2);
5400 if (TREE_CODE (op0) != SSA_NAME
5401 || TREE_CODE (op1) != SSA_NAME)
5402 continue;
5403 /* Swap operands if the second one is more expensive. */
5404 def0 = get_gimple_for_ssa_name (op0);
5405 def1 = get_gimple_for_ssa_name (op1);
5406 if (!def1)
5407 continue;
5408 swap = false;
5409 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5410 swap = true;
5411 if (swap)
5413 if (dump_file && (dump_flags & TDF_DETAILS))
5415 fprintf (dump_file, "Swap operands in stmt:\n");
5416 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5417 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5418 def0 ? lattice[gimple_uid (def0)] : 0,
5419 lattice[gimple_uid (def1)]);
5421 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5422 gimple_assign_rhs2_ptr (stmt));
5425 XDELETE (lattice);
5428 /* Expand basic block BB from GIMPLE trees to RTL. */
5430 static basic_block
5431 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5433 gimple_stmt_iterator gsi;
5434 gimple_seq stmts;
5435 gimple *stmt = NULL;
5436 rtx_note *note;
5437 rtx_insn *last;
5438 edge e;
5439 edge_iterator ei;
5441 if (dump_file)
5442 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5443 bb->index);
5445 /* Note that since we are now transitioning from GIMPLE to RTL, we
5446 cannot use the gsi_*_bb() routines because they expect the basic
5447 block to be in GIMPLE, instead of RTL. Therefore, we need to
5448 access the BB sequence directly. */
5449 if (optimize)
5450 reorder_operands (bb);
5451 stmts = bb_seq (bb);
5452 bb->il.gimple.seq = NULL;
5453 bb->il.gimple.phi_nodes = NULL;
5454 rtl_profile_for_bb (bb);
5455 init_rtl_bb_info (bb);
5456 bb->flags |= BB_RTL;
5458 /* Remove the RETURN_EXPR if we may fall through to the exit
5459 instead. */
5460 gsi = gsi_last (stmts);
5461 if (!gsi_end_p (gsi)
5462 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5464 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5466 gcc_assert (single_succ_p (bb));
5467 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5469 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5470 && !gimple_return_retval (ret_stmt))
5472 gsi_remove (&gsi, false);
5473 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5477 gsi = gsi_start (stmts);
5478 if (!gsi_end_p (gsi))
5480 stmt = gsi_stmt (gsi);
5481 if (gimple_code (stmt) != GIMPLE_LABEL)
5482 stmt = NULL;
5485 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5487 if (stmt || elt)
5489 last = get_last_insn ();
5491 if (stmt)
5493 expand_gimple_stmt (stmt);
5494 gsi_next (&gsi);
5497 if (elt)
5498 emit_label (*elt);
5500 BB_HEAD (bb) = NEXT_INSN (last);
5501 if (NOTE_P (BB_HEAD (bb)))
5502 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5503 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5505 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5507 else
5508 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5510 NOTE_BASIC_BLOCK (note) = bb;
5512 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5514 basic_block new_bb;
5516 stmt = gsi_stmt (gsi);
5518 /* If this statement is a non-debug one, and we generate debug
5519 insns, then this one might be the last real use of a TERed
5520 SSA_NAME, but where there are still some debug uses further
5521 down. Expanding the current SSA name in such further debug
5522 uses by their RHS might lead to wrong debug info, as coalescing
5523 might make the operands of such RHS be placed into the same
5524 pseudo as something else. Like so:
5525 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5526 use(a_1);
5527 a_2 = ...
5528 #DEBUG ... => a_1
5529 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5530 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5531 the write to a_2 would actually have clobbered the place which
5532 formerly held a_0.
5534 So, instead of that, we recognize the situation, and generate
5535 debug temporaries at the last real use of TERed SSA names:
5536 a_1 = a_0 + 1;
5537 #DEBUG #D1 => a_1
5538 use(a_1);
5539 a_2 = ...
5540 #DEBUG ... => #D1
5542 if (MAY_HAVE_DEBUG_INSNS
5543 && SA.values
5544 && !is_gimple_debug (stmt))
5546 ssa_op_iter iter;
5547 tree op;
5548 gimple *def;
5550 location_t sloc = curr_insn_location ();
5552 /* Look for SSA names that have their last use here (TERed
5553 names always have only one real use). */
5554 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5555 if ((def = get_gimple_for_ssa_name (op)))
5557 imm_use_iterator imm_iter;
5558 use_operand_p use_p;
5559 bool have_debug_uses = false;
5561 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5563 if (gimple_debug_bind_p (USE_STMT (use_p)))
5565 have_debug_uses = true;
5566 break;
5570 if (have_debug_uses)
5572 /* OP is a TERed SSA name, with DEF its defining
5573 statement, and where OP is used in further debug
5574 instructions. Generate a debug temporary, and
5575 replace all uses of OP in debug insns with that
5576 temporary. */
5577 gimple *debugstmt;
5578 tree value = gimple_assign_rhs_to_tree (def);
5579 tree vexpr = make_node (DEBUG_EXPR_DECL);
5580 rtx val;
5581 machine_mode mode;
5583 set_curr_insn_location (gimple_location (def));
5585 DECL_ARTIFICIAL (vexpr) = 1;
5586 TREE_TYPE (vexpr) = TREE_TYPE (value);
5587 if (DECL_P (value))
5588 mode = DECL_MODE (value);
5589 else
5590 mode = TYPE_MODE (TREE_TYPE (value));
5591 SET_DECL_MODE (vexpr, mode);
5593 val = gen_rtx_VAR_LOCATION
5594 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5596 emit_debug_insn (val);
5598 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5600 if (!gimple_debug_bind_p (debugstmt))
5601 continue;
5603 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5604 SET_USE (use_p, vexpr);
5606 update_stmt (debugstmt);
5610 set_curr_insn_location (sloc);
5613 currently_expanding_gimple_stmt = stmt;
5615 /* Expand this statement, then evaluate the resulting RTL and
5616 fixup the CFG accordingly. */
5617 if (gimple_code (stmt) == GIMPLE_COND)
5619 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5620 if (new_bb)
5621 return new_bb;
5623 else if (gimple_debug_bind_p (stmt))
5625 location_t sloc = curr_insn_location ();
5626 gimple_stmt_iterator nsi = gsi;
5628 for (;;)
5630 tree var = gimple_debug_bind_get_var (stmt);
5631 tree value;
5632 rtx val;
5633 machine_mode mode;
5635 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5636 && TREE_CODE (var) != LABEL_DECL
5637 && !target_for_debug_bind (var))
5638 goto delink_debug_stmt;
5640 if (gimple_debug_bind_has_value_p (stmt))
5641 value = gimple_debug_bind_get_value (stmt);
5642 else
5643 value = NULL_TREE;
5645 last = get_last_insn ();
5647 set_curr_insn_location (gimple_location (stmt));
5649 if (DECL_P (var))
5650 mode = DECL_MODE (var);
5651 else
5652 mode = TYPE_MODE (TREE_TYPE (var));
5654 val = gen_rtx_VAR_LOCATION
5655 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5657 emit_debug_insn (val);
5659 if (dump_file && (dump_flags & TDF_DETAILS))
5661 /* We can't dump the insn with a TREE where an RTX
5662 is expected. */
5663 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5664 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5665 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5668 delink_debug_stmt:
5669 /* In order not to generate too many debug temporaries,
5670 we delink all uses of debug statements we already expanded.
5671 Therefore debug statements between definition and real
5672 use of TERed SSA names will continue to use the SSA name,
5673 and not be replaced with debug temps. */
5674 delink_stmt_imm_use (stmt);
5676 gsi = nsi;
5677 gsi_next (&nsi);
5678 if (gsi_end_p (nsi))
5679 break;
5680 stmt = gsi_stmt (nsi);
5681 if (!gimple_debug_bind_p (stmt))
5682 break;
5685 set_curr_insn_location (sloc);
5687 else if (gimple_debug_source_bind_p (stmt))
5689 location_t sloc = curr_insn_location ();
5690 tree var = gimple_debug_source_bind_get_var (stmt);
5691 tree value = gimple_debug_source_bind_get_value (stmt);
5692 rtx val;
5693 machine_mode mode;
5695 last = get_last_insn ();
5697 set_curr_insn_location (gimple_location (stmt));
5699 mode = DECL_MODE (var);
5701 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5702 VAR_INIT_STATUS_UNINITIALIZED);
5704 emit_debug_insn (val);
5706 if (dump_file && (dump_flags & TDF_DETAILS))
5708 /* We can't dump the insn with a TREE where an RTX
5709 is expected. */
5710 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5711 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5712 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5715 set_curr_insn_location (sloc);
5717 else
5719 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5720 if (call_stmt
5721 && gimple_call_tail_p (call_stmt)
5722 && disable_tail_calls)
5723 gimple_call_set_tail (call_stmt, false);
5725 if (call_stmt && gimple_call_tail_p (call_stmt))
5727 bool can_fallthru;
5728 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5729 if (new_bb)
5731 if (can_fallthru)
5732 bb = new_bb;
5733 else
5734 return new_bb;
5737 else
5739 def_operand_p def_p;
5740 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5742 if (def_p != NULL)
5744 /* Ignore this stmt if it is in the list of
5745 replaceable expressions. */
5746 if (SA.values
5747 && bitmap_bit_p (SA.values,
5748 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5749 continue;
5751 last = expand_gimple_stmt (stmt);
5752 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5757 currently_expanding_gimple_stmt = NULL;
5759 /* Expand implicit goto and convert goto_locus. */
5760 FOR_EACH_EDGE (e, ei, bb->succs)
5762 if (e->goto_locus != UNKNOWN_LOCATION)
5763 set_curr_insn_location (e->goto_locus);
5764 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5766 emit_jump (label_rtx_for_bb (e->dest));
5767 e->flags &= ~EDGE_FALLTHRU;
5771 /* Expanded RTL can create a jump in the last instruction of block.
5772 This later might be assumed to be a jump to successor and break edge insertion.
5773 We need to insert dummy move to prevent this. PR41440. */
5774 if (single_succ_p (bb)
5775 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5776 && (last = get_last_insn ())
5777 && (JUMP_P (last)
5778 || (DEBUG_INSN_P (last)
5779 && JUMP_P (prev_nondebug_insn (last)))))
5781 rtx dummy = gen_reg_rtx (SImode);
5782 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5785 do_pending_stack_adjust ();
5787 /* Find the block tail. The last insn in the block is the insn
5788 before a barrier and/or table jump insn. */
5789 last = get_last_insn ();
5790 if (BARRIER_P (last))
5791 last = PREV_INSN (last);
5792 if (JUMP_TABLE_DATA_P (last))
5793 last = PREV_INSN (PREV_INSN (last));
5794 BB_END (bb) = last;
5796 update_bb_for_insn (bb);
5798 return bb;
5802 /* Create a basic block for initialization code. */
5804 static basic_block
5805 construct_init_block (void)
5807 basic_block init_block, first_block;
5808 edge e = NULL;
5809 int flags;
5811 /* Multiple entry points not supported yet. */
5812 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5813 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5814 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5815 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5816 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5818 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5820 /* When entry edge points to first basic block, we don't need jump,
5821 otherwise we have to jump into proper target. */
5822 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5824 tree label = gimple_block_label (e->dest);
5826 emit_jump (jump_target_rtx (label));
5827 flags = 0;
5829 else
5830 flags = EDGE_FALLTHRU;
5832 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5833 get_last_insn (),
5834 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5835 init_block->frequency = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
5836 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5837 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5838 if (e)
5840 first_block = e->dest;
5841 redirect_edge_succ (e, init_block);
5842 e = make_single_succ_edge (init_block, first_block, flags);
5844 else
5845 e = make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5846 EDGE_FALLTHRU);
5848 update_bb_for_insn (init_block);
5849 return init_block;
5852 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5853 found in the block tree. */
5855 static void
5856 set_block_levels (tree block, int level)
5858 while (block)
5860 BLOCK_NUMBER (block) = level;
5861 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5862 block = BLOCK_CHAIN (block);
5866 /* Create a block containing landing pads and similar stuff. */
5868 static void
5869 construct_exit_block (void)
5871 rtx_insn *head = get_last_insn ();
5872 rtx_insn *end;
5873 basic_block exit_block;
5874 edge e, e2;
5875 unsigned ix;
5876 edge_iterator ei;
5877 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5878 rtx_insn *orig_end = BB_END (prev_bb);
5880 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5882 /* Make sure the locus is set to the end of the function, so that
5883 epilogue line numbers and warnings are set properly. */
5884 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5885 input_location = cfun->function_end_locus;
5887 /* Generate rtl for function exit. */
5888 expand_function_end ();
5890 end = get_last_insn ();
5891 if (head == end)
5892 return;
5893 /* While emitting the function end we could move end of the last basic
5894 block. */
5895 BB_END (prev_bb) = orig_end;
5896 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5897 head = NEXT_INSN (head);
5898 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5899 bb frequency counting will be confused. Any instructions before that
5900 label are emitted for the case where PREV_BB falls through into the
5901 exit block, so append those instructions to prev_bb in that case. */
5902 if (NEXT_INSN (head) != return_label)
5904 while (NEXT_INSN (head) != return_label)
5906 if (!NOTE_P (NEXT_INSN (head)))
5907 BB_END (prev_bb) = NEXT_INSN (head);
5908 head = NEXT_INSN (head);
5911 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5912 exit_block->frequency = EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency;
5913 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5914 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5916 ix = 0;
5917 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5919 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5920 if (!(e->flags & EDGE_ABNORMAL))
5921 redirect_edge_succ (e, exit_block);
5922 else
5923 ix++;
5926 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
5927 EDGE_FALLTHRU);
5928 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5929 if (e2 != e)
5931 e->count -= e2->count;
5932 exit_block->count -= e2->count;
5933 exit_block->frequency -= EDGE_FREQUENCY (e2);
5935 if (exit_block->frequency < 0)
5936 exit_block->frequency = 0;
5937 update_bb_for_insn (exit_block);
5940 /* Helper function for discover_nonconstant_array_refs.
5941 Look for ARRAY_REF nodes with non-constant indexes and mark them
5942 addressable. */
5944 static tree
5945 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5946 void *data ATTRIBUTE_UNUSED)
5948 tree t = *tp;
5950 if (IS_TYPE_OR_DECL_P (t))
5951 *walk_subtrees = 0;
5952 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5954 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5955 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5956 && (!TREE_OPERAND (t, 2)
5957 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5958 || (TREE_CODE (t) == COMPONENT_REF
5959 && (!TREE_OPERAND (t,2)
5960 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5961 || TREE_CODE (t) == BIT_FIELD_REF
5962 || TREE_CODE (t) == REALPART_EXPR
5963 || TREE_CODE (t) == IMAGPART_EXPR
5964 || TREE_CODE (t) == VIEW_CONVERT_EXPR
5965 || CONVERT_EXPR_P (t))
5966 t = TREE_OPERAND (t, 0);
5968 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5970 t = get_base_address (t);
5971 if (t && DECL_P (t)
5972 && DECL_MODE (t) != BLKmode)
5973 TREE_ADDRESSABLE (t) = 1;
5976 *walk_subtrees = 0;
5979 return NULL_TREE;
5982 /* RTL expansion is not able to compile array references with variable
5983 offsets for arrays stored in single register. Discover such
5984 expressions and mark variables as addressable to avoid this
5985 scenario. */
5987 static void
5988 discover_nonconstant_array_refs (void)
5990 basic_block bb;
5991 gimple_stmt_iterator gsi;
5993 FOR_EACH_BB_FN (bb, cfun)
5994 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5996 gimple *stmt = gsi_stmt (gsi);
5997 if (!is_gimple_debug (stmt))
5998 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
6002 /* This function sets crtl->args.internal_arg_pointer to a virtual
6003 register if DRAP is needed. Local register allocator will replace
6004 virtual_incoming_args_rtx with the virtual register. */
6006 static void
6007 expand_stack_alignment (void)
6009 rtx drap_rtx;
6010 unsigned int preferred_stack_boundary;
6012 if (! SUPPORTS_STACK_ALIGNMENT)
6013 return;
6015 if (cfun->calls_alloca
6016 || cfun->has_nonlocal_label
6017 || crtl->has_nonlocal_goto)
6018 crtl->need_drap = true;
6020 /* Call update_stack_boundary here again to update incoming stack
6021 boundary. It may set incoming stack alignment to a different
6022 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6023 use the minimum incoming stack alignment to check if it is OK
6024 to perform sibcall optimization since sibcall optimization will
6025 only align the outgoing stack to incoming stack boundary. */
6026 if (targetm.calls.update_stack_boundary)
6027 targetm.calls.update_stack_boundary ();
6029 /* The incoming stack frame has to be aligned at least at
6030 parm_stack_boundary. */
6031 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6033 /* Update crtl->stack_alignment_estimated and use it later to align
6034 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6035 exceptions since callgraph doesn't collect incoming stack alignment
6036 in this case. */
6037 if (cfun->can_throw_non_call_exceptions
6038 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6039 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6040 else
6041 preferred_stack_boundary = crtl->preferred_stack_boundary;
6042 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6043 crtl->stack_alignment_estimated = preferred_stack_boundary;
6044 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6045 crtl->stack_alignment_needed = preferred_stack_boundary;
6047 gcc_assert (crtl->stack_alignment_needed
6048 <= crtl->stack_alignment_estimated);
6050 crtl->stack_realign_needed
6051 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6052 crtl->stack_realign_tried = crtl->stack_realign_needed;
6054 crtl->stack_realign_processed = true;
6056 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6057 alignment. */
6058 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6059 drap_rtx = targetm.calls.get_drap_rtx ();
6061 /* stack_realign_drap and drap_rtx must match. */
6062 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6064 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6065 if (NULL != drap_rtx)
6067 crtl->args.internal_arg_pointer = drap_rtx;
6069 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6070 needed. */
6071 fixup_tail_calls ();
6076 static void
6077 expand_main_function (void)
6079 #if (defined(INVOKE__main) \
6080 || (!defined(HAS_INIT_SECTION) \
6081 && !defined(INIT_SECTION_ASM_OP) \
6082 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6083 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
6084 #endif
6088 /* Expand code to initialize the stack_protect_guard. This is invoked at
6089 the beginning of a function to be protected. */
6091 static void
6092 stack_protect_prologue (void)
6094 tree guard_decl = targetm.stack_protect_guard ();
6095 rtx x, y;
6097 x = expand_normal (crtl->stack_protect_guard);
6098 if (guard_decl)
6099 y = expand_normal (guard_decl);
6100 else
6101 y = const0_rtx;
6103 /* Allow the target to copy from Y to X without leaking Y into a
6104 register. */
6105 if (targetm.have_stack_protect_set ())
6106 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6108 emit_insn (insn);
6109 return;
6112 /* Otherwise do a straight move. */
6113 emit_move_insn (x, y);
6116 /* Translate the intermediate representation contained in the CFG
6117 from GIMPLE trees to RTL.
6119 We do conversion per basic block and preserve/update the tree CFG.
6120 This implies we have to do some magic as the CFG can simultaneously
6121 consist of basic blocks containing RTL and GIMPLE trees. This can
6122 confuse the CFG hooks, so be careful to not manipulate CFG during
6123 the expansion. */
6125 namespace {
6127 const pass_data pass_data_expand =
6129 RTL_PASS, /* type */
6130 "expand", /* name */
6131 OPTGROUP_NONE, /* optinfo_flags */
6132 TV_EXPAND, /* tv_id */
6133 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6134 | PROP_gimple_lcx
6135 | PROP_gimple_lvec
6136 | PROP_gimple_lva), /* properties_required */
6137 PROP_rtl, /* properties_provided */
6138 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6139 0, /* todo_flags_start */
6140 0, /* todo_flags_finish */
6143 class pass_expand : public rtl_opt_pass
6145 public:
6146 pass_expand (gcc::context *ctxt)
6147 : rtl_opt_pass (pass_data_expand, ctxt)
6150 /* opt_pass methods: */
6151 virtual unsigned int execute (function *);
6153 }; // class pass_expand
/* Run the RTL expansion pass on FUN: rewrite the function out of SSA
   form, expand its variables and parameters, convert every basic block
   after the init block to RTL with expand_gimple_basic_block, build the
   exit block, commit the insns queued on edges, rediscover sub basic
   blocks, finish stack alignment and EH generation, and clean up the
   resulting CFG.  Always returns 0.  */
6155 unsigned int
6156 pass_expand::execute (function *fun)
6158 basic_block bb, init_block;
6159 edge_iterator ei;
6160 edge e;
6161 rtx_insn *var_seq, *var_ret_seq;
6162 unsigned i;
6164 timevar_push (TV_OUT_OF_SSA);
6165 rewrite_out_of_ssa (&SA);
6166 timevar_pop (TV_OUT_OF_SSA);
6167 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6169 if (MAY_HAVE_DEBUG_STMTS && flag_tree_ter)
6171 gimple_stmt_iterator gsi;
6172 FOR_EACH_BB_FN (bb, cfun)
6173 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6174 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6175 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6178 /* Make sure all values used by the optimization passes have sane
6179 defaults. */
6180 reg_renumber = 0;
6182 /* Some backends want to know that we are expanding to RTL. */
6183 currently_expanding_to_rtl = 1;
6184 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6185 free_dominance_info (CDI_DOMINATORS);
6187 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6189 if (chkp_function_instrumented_p (current_function_decl))
6190 chkp_reset_rtl_bounds ();
/* Choose the location recorded as prologue_location: the function's
   start locus (or its declaration's location when no start locus is
   set), or UNKNOWN_LOCATION for builtins. */
6192 insn_locations_init ();
6193 if (!DECL_IS_BUILTIN (current_function_decl))
6195 /* Eventually, all FEs should explicitly set function_start_locus. */
6196 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6197 set_curr_insn_location
6198 (DECL_SOURCE_LOCATION (current_function_decl));
6199 else
6200 set_curr_insn_location (fun->function_start_locus);
6202 else
6203 set_curr_insn_location (UNKNOWN_LOCATION);
6204 prologue_location = curr_insn_location ();
6206 #ifdef INSN_SCHEDULING
6207 init_sched_attrs ();
6208 #endif
6210 /* Make sure first insn is a note even if we don't want linenums.
6211 This makes sure the first insn will never be deleted.
6212 Also, final expects a note to appear there. */
6213 emit_note (NOTE_INSN_DELETED);
6215 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6216 discover_nonconstant_array_refs ();
6218 targetm.expand_to_rtl_hook ();
6219 crtl->init_stack_alignment ();
6220 fun->cfg->max_jumptable_ents = 0;
6222 /* Resolve the function section. Some targets, like ARM EABI rely on knowledge
6223 of the function section at expansion time to predict distance of calls. */
6224 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6226 /* Expand the variables recorded during gimple lowering. */
6227 timevar_push (TV_VAR_EXPAND);
6228 start_sequence ();
6230 var_ret_seq = expand_used_vars ();
6232 var_seq = get_insns ();
6233 end_sequence ();
6234 timevar_pop (TV_VAR_EXPAND);
6236 /* Honor stack protection warnings. */
6237 if (warn_stack_protect)
6239 if (fun->calls_alloca)
6240 warning (OPT_Wstack_protector,
6241 "stack protector not protecting local variables: "
6242 "variable length buffer");
6243 if (has_short_buffer && !crtl->stack_protect_guard)
6244 warning (OPT_Wstack_protector,
6245 "stack protector not protecting function: "
6246 "all local arrays are less than %d bytes long",
6247 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6250 /* Set up parameters and prepare for return, for the function. */
6251 expand_function_start (current_function_decl);
6253 /* If we emitted any instructions for setting up the variables,
6254 emit them before the FUNCTION_START note. */
6255 if (var_seq)
6257 emit_insn_before (var_seq, parm_birth_insn);
6259 /* In expand_function_end we'll insert the alloca save/restore
6260 before parm_birth_insn. We've just inserted an alloca call.
6261 Adjust the pointer to match. */
6262 parm_birth_insn = var_seq;
6265 /* Now propagate the RTL assignment of each partition to the
6266 underlying var of each SSA_NAME. */
6267 tree name;
6269 FOR_EACH_SSA_NAME (i, name, cfun)
6271 /* We might have generated new SSA names in
6272 update_alias_info_with_stack_vars. They will have a NULL
6273 defining statements, and won't be part of the partitioning,
6274 so ignore those. */
6275 if (!SSA_NAME_DEF_STMT (name))
6276 continue;
6278 adjust_one_expanded_partition_var (name);
6281 /* Clean up RTL of variables that straddle across multiple
6282 partitions, and check that the rtl of any PARM_DECLs that are not
6283 cleaned up is that of their default defs. */
6284 FOR_EACH_SSA_NAME (i, name, cfun)
6286 int part;
6288 /* We might have generated new SSA names in
6289 update_alias_info_with_stack_vars. They will have a NULL
6290 defining statements, and won't be part of the partitioning,
6291 so ignore those. */
6292 if (!SSA_NAME_DEF_STMT (name))
6293 continue;
6294 part = var_to_partition (SA.map, name);
6295 if (part == NO_PARTITION)
6296 continue;
6298 /* If this decl was marked as living in multiple places, reset
6299 this now to NULL. */
6300 tree var = SSA_NAME_VAR (name);
6301 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6302 SET_DECL_RTL (var, NULL);
6303 /* Check that the pseudos chosen by assign_parms are those of
6304 the corresponding default defs. */
6305 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6306 && (TREE_CODE (var) == PARM_DECL
6307 || TREE_CODE (var) == RESULT_DECL))
6309 rtx in = DECL_RTL_IF_SET (var);
6310 gcc_assert (in);
6311 rtx out = SA.partition_to_pseudo[part];
6312 gcc_assert (in == out);
6314 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6315 those expected by debug backends for each parm and for
6316 the result. This is particularly important for stabs,
6317 whose register elimination from parm's DECL_RTL may cause
6318 -fcompare-debug differences as SET_DECL_RTL changes reg's
6319 attrs. So, make sure the RTL already has the parm as the
6320 EXPR, so that it won't change. */
6321 SET_DECL_RTL (var, NULL_RTX);
6322 if (MEM_P (in))
6323 set_mem_attributes (in, var, true);
6324 SET_DECL_RTL (var, in);
6328 /* If this function is `main', emit a call to `__main'
6329 to run global initializers, etc. */
6330 if (DECL_NAME (current_function_decl)
6331 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6332 && DECL_FILE_SCOPE_P (current_function_decl))
6333 expand_main_function ();
6335 /* Initialize the stack_protect_guard field. This must happen after the
6336 call to __main (if any) so that the external decl is initialized. */
6337 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6338 stack_protect_prologue ();
6340 expand_phi_nodes (&SA);
6342 /* Release any stale SSA redirection data. */
6343 redirect_edge_var_map_empty ();
6345 /* Register rtl specific functions for cfg. */
6346 rtl_register_cfg_hooks ();
6348 init_block = construct_init_block ();
6350 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6351 remaining edges later. */
6352 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6353 e->flags &= ~EDGE_EXECUTABLE;
/* Expand each block after the init block.  The loop variable is
   reassigned from expand_gimple_basic_block's return value, so the
   iteration continues from whichever block that call returns. */
6355 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6356 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6357 next_bb)
6358 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6360 if (MAY_HAVE_DEBUG_INSNS)
6361 expand_debug_locations ();
6363 if (deep_ter_debug_map)
6365 delete deep_ter_debug_map;
6366 deep_ter_debug_map = NULL;
6369 /* Free stuff we no longer need after GIMPLE optimizations. */
6370 free_dominance_info (CDI_DOMINATORS);
6371 free_dominance_info (CDI_POST_DOMINATORS);
6372 delete_tree_cfg_annotations (fun);
6374 timevar_push (TV_OUT_OF_SSA);
6375 finish_out_of_ssa (&SA);
6376 timevar_pop (TV_OUT_OF_SSA);
6378 timevar_push (TV_POST_EXPAND);
6379 /* We are no longer in SSA form. */
6380 fun->gimple_df->in_ssa_p = false;
6381 loops_state_clear (LOOP_CLOSED_SSA);
6383 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6384 conservatively to true until they are all profile aware. */
/* NOTE(review): the comment above does not describe the statements that
   follow it (they free the block-label map and the histograms) -- it
   looks stale; confirm before relying on it. */
6385 delete lab_rtx_for_bb;
6386 free_histograms (fun);
6388 construct_exit_block ();
6389 insn_locations_finalize ();
/* Emit the insns returned by expand_used_vars after the return label,
   or after the basic block note that directly follows that label. */
6391 if (var_ret_seq)
6393 rtx_insn *after = return_label;
6394 rtx_insn *next = NEXT_INSN (after);
6395 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6396 after = next;
6397 emit_insn_after (var_ret_seq, after);
6400 /* Zap the tree EH table. */
6401 set_eh_throw_stmt_table (fun, NULL);
6403 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6404 split edges which edge insertions might do. */
6405 rebuild_jump_labels (get_insns ());
/* Commit the insns queued on edges.  The iterator is advanced only for
   edges that had no queued insns. */
6407 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6408 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6410 edge e;
6411 edge_iterator ei;
6412 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6414 if (e->insns.r)
6416 rebuild_jump_labels_chain (e->insns.r);
6417 /* Put insns after parm birth, but before
6418 NOTE_INSNS_FUNCTION_BEG. */
6419 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6420 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6422 rtx_insn *insns = e->insns.r;
6423 e->insns.r = NULL;
6424 if (NOTE_P (parm_birth_insn)
6425 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6426 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6427 else
6428 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6430 else
6431 commit_one_edge_insertion (e);
6433 else
6434 ei_next (&ei);
6438 /* We're done expanding trees to RTL. */
6439 currently_expanding_to_rtl = 0;
6441 flush_mark_addressable_queue ();
6443 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6444 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6446 edge e;
6447 edge_iterator ei;
6448 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6450 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6451 e->flags &= ~EDGE_EXECUTABLE;
6453 /* At the moment not all abnormal edges match the RTL
6454 representation. It is safe to remove them here as
6455 find_many_sub_basic_blocks will rediscover them.
6456 In the future we should get this fixed properly. */
6457 if ((e->flags & EDGE_ABNORMAL)
6458 && !(e->flags & EDGE_SIBCALL))
6459 remove_edge (e);
6460 else
6461 ei_next (&ei);
6465 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6466 bitmap_ones (blocks);
6467 find_many_sub_basic_blocks (blocks);
6468 purge_all_dead_edges ();
6470 expand_stack_alignment ();
6472 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6473 function. */
6474 if (crtl->tail_call_emit)
6475 fixup_tail_calls ();
6477 /* After initial rtl generation, call back to finish generating
6478 exception support code. We need to do this before cleaning up
6479 the CFG as the code does not expect dead landing pads. */
6480 if (fun->eh->region_tree != NULL)
6481 finish_eh_generation ();
6483 /* BB subdivision may have created basic blocks that are only reachable
6484 from unlikely bbs but not marked as such in the profile. */
6485 if (optimize)
6486 propagate_unlikely_bbs_forward ();
6488 /* Remove unreachable blocks, otherwise we cannot compute dominators
6489 which are needed for loop state verification. As a side-effect
6490 this also compacts blocks.
6491 ??? We cannot remove trivially dead insns here as for example
6492 the DRAP reg on i?86 is not magically live at this point.
6493 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6494 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6496 checking_verify_flow_info ();
6498 /* Initialize pseudos allocated for hard registers. */
6499 emit_initial_value_sets ();
6501 /* And finally unshare all RTL. */
6502 unshare_all_rtl ();
6504 /* There's no need to defer outputting this function any more; we
6505 know we want to output it. */
6506 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6508 /* Now that we're done expanding trees to RTL, we shouldn't have any
6509 more CONCATs anywhere. */
6510 generating_concat_p = 0;
6512 if (dump_file)
6514 fprintf (dump_file,
6515 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6516 /* And the pass manager will dump RTL for us. */
6519 /* If we're emitting a nested function, make sure its parent gets
6520 emitted as well. Doing otherwise confuses debug info. */
6522 tree parent;
6523 for (parent = DECL_CONTEXT (current_function_decl);
6524 parent != NULL_TREE;
6525 parent = get_containing_scope (parent))
6526 if (TREE_CODE (parent) == FUNCTION_DECL)
6527 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6530 /* We are now committed to emitting code for this function. Do any
6531 preparation, such as emitting abstract debug info for the inline
6532 before it gets mangled by optimization. */
6533 if (cgraph_function_possibly_inlined_p (current_function_decl))
6534 (*debug_hooks->outlining_inline_function) (current_function_decl);
6536 TREE_ASM_WRITTEN (current_function_decl) = 1;
6538 /* After expanding, the return labels are no longer needed. */
6539 return_label = NULL;
6540 naked_return_label = NULL;
6542 /* After expanding, the tm_restart map is no longer needed. */
6543 if (fun->gimple_df->tm_restart)
6544 fun->gimple_df->tm_restart = NULL;
6546 /* Tag the blocks with a depth number so that change_scope can find
6547 the common parent easily. */
6548 set_block_levels (DECL_INITIAL (fun->decl), 0);
6549 default_rtl_profile ();
6551 /* For -dx discard loops now, otherwise IL verify in clean_state will
6552 ICE. */
6553 if (rtl_dump_and_exit)
6555 cfun->curr_properties &= ~PROP_loops;
6556 loop_optimizer_finalize ();
6559 timevar_pop (TV_POST_EXPAND);
6561 return 0;
6564 } // anon namespace
6566 rtl_opt_pass *
6567 make_pass_expand (gcc::context *ctxt)
6569 return new pass_expand (ctxt);