2015-09-25 Vladimir Makarov <vmakarov@redhat.com>
[official-gcc.git] / gcc / cfgexpand.c
blob6c9284ffc8cb55f5faf047153839b1c8c5d875f6
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2015 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "cfghooks.h"
25 #include "tree.h"
26 #include "gimple.h"
27 #include "rtl.h"
28 #include "ssa.h"
29 #include "alias.h"
30 #include "fold-const.h"
31 #include "varasm.h"
32 #include "stor-layout.h"
33 #include "stmt.h"
34 #include "print-tree.h"
35 #include "tm_p.h"
36 #include "cfgrtl.h"
37 #include "cfganal.h"
38 #include "cfgbuild.h"
39 #include "cfgcleanup.h"
40 #include "insn-codes.h"
41 #include "optabs.h"
42 #include "flags.h"
43 #include "insn-config.h"
44 #include "expmed.h"
45 #include "dojump.h"
46 #include "explow.h"
47 #include "calls.h"
48 #include "emit-rtl.h"
49 #include "expr.h"
50 #include "langhooks.h"
51 #include "internal-fn.h"
52 #include "tree-eh.h"
53 #include "gimple-iterator.h"
54 #include "gimple-walk.h"
55 #include "cgraph.h"
56 #include "tree-cfg.h"
57 #include "tree-dfa.h"
58 #include "tree-ssa.h"
59 #include "tree-pass.h"
60 #include "except.h"
61 #include "diagnostic.h"
62 #include "gimple-pretty-print.h"
63 #include "toplev.h"
64 #include "debug.h"
65 #include "params.h"
66 #include "tree-inline.h"
67 #include "value-prof.h"
68 #include "target.h"
69 #include "tree-ssa-live.h"
70 #include "tree-outof-ssa.h"
71 #include "cfgloop.h"
72 #include "regs.h" /* For reg_renumber. */
73 #include "insn-attr.h" /* For INSN_SCHEDULING. */
74 #include "asan.h"
75 #include "tree-ssa-address.h"
76 #include "recog.h"
77 #include "output.h"
78 #include "builtins.h"
79 #include "tree-chkp.h"
80 #include "rtl-chkp.h"
82 /* Some systems use __main in a way incompatible with its use in gcc, in these
83 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
84 give the same symbol without quotes for an alternative entry point. You
85 must define both, or neither. */
86 #ifndef NAME__MAIN
87 #define NAME__MAIN "__main"
88 #endif
90 /* This variable holds information helping the rewriting of SSA trees
91 into RTL. */
92 struct ssaexpand SA;
94 /* This variable holds the currently expanded gimple statement for purposes
95 of communicating the profile info to the builtin expanders. */
96 gimple *currently_expanding_gimple_stmt;
98 static rtx expand_debug_expr (tree);
100 static bool defer_stack_allocation (tree, bool);
102 /* Return an expression tree corresponding to the RHS of GIMPLE
103 statement STMT. */
105 tree
106 gimple_assign_rhs_to_tree (gimple *stmt)
108 tree t;
109 enum gimple_rhs_class grhs_class;
111 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
113 if (grhs_class == GIMPLE_TERNARY_RHS)
114 t = build3 (gimple_assign_rhs_code (stmt),
115 TREE_TYPE (gimple_assign_lhs (stmt)),
116 gimple_assign_rhs1 (stmt),
117 gimple_assign_rhs2 (stmt),
118 gimple_assign_rhs3 (stmt));
119 else if (grhs_class == GIMPLE_BINARY_RHS)
120 t = build2 (gimple_assign_rhs_code (stmt),
121 TREE_TYPE (gimple_assign_lhs (stmt)),
122 gimple_assign_rhs1 (stmt),
123 gimple_assign_rhs2 (stmt));
124 else if (grhs_class == GIMPLE_UNARY_RHS)
125 t = build1 (gimple_assign_rhs_code (stmt),
126 TREE_TYPE (gimple_assign_lhs (stmt)),
127 gimple_assign_rhs1 (stmt));
128 else if (grhs_class == GIMPLE_SINGLE_RHS)
130 t = gimple_assign_rhs1 (stmt);
131 /* Avoid modifying this tree in place below. */
132 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
133 && gimple_location (stmt) != EXPR_LOCATION (t))
134 || (gimple_block (stmt)
135 && currently_expanding_to_rtl
136 && EXPR_P (t)))
137 t = copy_node (t);
139 else
140 gcc_unreachable ();
142 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
143 SET_EXPR_LOCATION (t, gimple_location (stmt));
145 return t;
149 #ifndef STACK_ALIGNMENT_NEEDED
150 #define STACK_ALIGNMENT_NEEDED 1
151 #endif
/* Yield SSA_NAME_VAR (X) when X is an SSA_NAME, and X itself otherwise.
   X is expanded more than once, so it must be free of side effects.  */
#define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : (x))
155 /* Choose either CUR or NEXT as the leader DECL for a partition.
156 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
157 out of the same user variable being in multiple partitions (this is
158 less likely for compiler-introduced temps). */
160 static tree
161 leader_merge (tree cur, tree next)
163 if (cur == NULL || cur == next)
164 return next;
166 if (DECL_P (cur) && DECL_IGNORED_P (cur))
167 return cur;
169 if (DECL_P (next) && DECL_IGNORED_P (next))
170 return next;
172 return cur;
175 /* Return true if VAR is a PARM_DECL or a RESULT_DECL that ought to be
176 assigned to a stack slot. We can't have expand_one_ssa_partition
177 choose their address: the pseudo holding the address would be set
178 up too late for assign_params to copy the parameter if needed.
180 Such parameters are likely passed as a pointer to the value, rather
181 than as a value, and so we must not coalesce them, nor allocate
182 stack space for them before determining the calling conventions for
183 them.
185 For their SSA_NAMEs, expand_one_ssa_partition emits RTL as MEMs
186 with pc_rtx as the address, and then it replaces the pc_rtx with
187 NULL so as to make sure the MEM is not used before it is adjusted
188 in assign_parm_setup_reg. */
190 bool
191 parm_in_stack_slot_p (tree var)
193 if (!var || VAR_P (var))
194 return false;
196 gcc_assert (TREE_CODE (var) == PARM_DECL
197 || TREE_CODE (var) == RESULT_DECL);
199 return !use_register_for_decl (var);
202 /* Return the partition of the default SSA_DEF for decl VAR. */
204 static int
205 ssa_default_def_partition (tree var)
207 tree name = ssa_default_def (cfun, var);
209 if (!name)
210 return NO_PARTITION;
212 return var_to_partition (SA.map, name);
215 /* Return the RTL for the default SSA def of a PARM or RESULT, if
216 there is one. */
219 get_rtl_for_parm_ssa_default_def (tree var)
221 gcc_assert (TREE_CODE (var) == PARM_DECL || TREE_CODE (var) == RESULT_DECL);
223 if (!is_gimple_reg (var))
224 return NULL_RTX;
226 /* If we've already determined RTL for the decl, use it. This is
227 not just an optimization: if VAR is a PARM whose incoming value
228 is unused, we won't find a default def to use its partition, but
229 we still want to use the location of the parm, if it was used at
230 all. During assign_parms, until a location is assigned for the
231 VAR, RTL can only for a parm or result if we're not coalescing
232 across variables, when we know we're coalescing all SSA_NAMEs of
233 each parm or result, and we're not coalescing them with names
234 pertaining to other variables, such as other parms' default
235 defs. */
236 if (DECL_RTL_SET_P (var))
238 gcc_assert (DECL_RTL (var) != pc_rtx);
239 return DECL_RTL (var);
242 int part = ssa_default_def_partition (var);
243 if (part == NO_PARTITION)
244 return NULL_RTX;
246 return SA.partition_to_pseudo[part];
249 /* Associate declaration T with storage space X. If T is no
250 SSA name this is exactly SET_DECL_RTL, otherwise make the
251 partition of T associated with X. */
252 static inline void
253 set_rtl (tree t, rtx x)
255 if (x && SSAVAR (t))
257 bool skip = false;
258 tree cur = NULL_TREE;
260 if (MEM_P (x))
261 cur = MEM_EXPR (x);
262 else if (REG_P (x))
263 cur = REG_EXPR (x);
264 else if (GET_CODE (x) == CONCAT
265 && REG_P (XEXP (x, 0)))
266 cur = REG_EXPR (XEXP (x, 0));
267 else if (GET_CODE (x) == PARALLEL)
268 cur = REG_EXPR (XVECEXP (x, 0, 0));
269 else if (x == pc_rtx)
270 skip = true;
271 else
272 gcc_unreachable ();
274 tree next = skip ? cur : leader_merge (cur, SSAVAR (t));
276 if (cur != next)
278 if (MEM_P (x))
279 set_mem_attributes (x, next, true);
280 else
281 set_reg_attrs_for_decl_rtl (next, x);
285 if (TREE_CODE (t) == SSA_NAME)
287 int part = var_to_partition (SA.map, t);
288 if (part != NO_PARTITION)
290 if (SA.partition_to_pseudo[part])
291 gcc_assert (SA.partition_to_pseudo[part] == x);
292 else if (x != pc_rtx)
293 SA.partition_to_pseudo[part] = x;
295 /* For the benefit of debug information at -O0 (where
296 vartracking doesn't run) record the place also in the base
297 DECL. For PARMs and RESULTs, we may end up resetting these
298 in function.c:maybe_reset_rtl_for_parm, but in some rare
299 cases we may need them (unused and overwritten incoming
300 value, that at -O0 must share the location with the other
301 uses in spite of the missing default def), and this may be
302 the only chance to preserve them. */
303 if (x && x != pc_rtx && SSA_NAME_VAR (t))
305 tree var = SSA_NAME_VAR (t);
306 /* If we don't yet have something recorded, just record it now. */
307 if (!DECL_RTL_SET_P (var))
308 SET_DECL_RTL (var, x);
309 /* If we have it set already to "multiple places" don't
310 change this. */
311 else if (DECL_RTL (var) == pc_rtx)
313 /* If we have something recorded and it's not the same place
314 as we want to record now, we have multiple partitions for the
315 same base variable, with different places. We can't just
316 randomly chose one, hence we have to say that we don't know.
317 This only happens with optimization, and there var-tracking
318 will figure out the right thing. */
319 else if (DECL_RTL (var) != x)
320 SET_DECL_RTL (var, pc_rtx);
323 else
324 SET_DECL_RTL (t, x);
327 /* This structure holds data relevant to one variable that will be
328 placed in a stack slot. */
329 struct stack_var
331 /* The Variable. */
332 tree decl;
334 /* Initially, the size of the variable. Later, the size of the partition,
335 if this variable becomes it's partition's representative. */
336 HOST_WIDE_INT size;
338 /* The *byte* alignment required for this variable. Or as, with the
339 size, the alignment for this partition. */
340 unsigned int alignb;
342 /* The partition representative. */
343 size_t representative;
345 /* The next stack variable in the partition, or EOC. */
346 size_t next;
348 /* The numbers of conflicting stack variables. */
349 bitmap conflicts;
352 #define EOC ((size_t)-1)
354 /* We have an array of such objects while deciding allocation. */
355 static struct stack_var *stack_vars;
356 static size_t stack_vars_alloc;
357 static size_t stack_vars_num;
358 static hash_map<tree, size_t> *decl_to_stack_part;
360 /* Conflict bitmaps go on this obstack. This allows us to destroy
361 all of them in one big sweep. */
362 static bitmap_obstack stack_var_bitmap_obstack;
364 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
365 is non-decreasing. */
366 static size_t *stack_vars_sorted;
368 /* The phase of the stack frame. This is the known misalignment of
369 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
370 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
371 static int frame_phase;
373 /* Used during expand_used_vars to remember if we saw any decls for
374 which we'd like to enable stack smashing protection. */
375 static bool has_protected_decls;
377 /* Used during expand_used_vars. Remember if we saw a character buffer
378 smaller than our cutoff threshold. Used for -Wstack-protector. */
379 static bool has_short_buffer;
381 /* Compute the byte alignment to use for DECL. Ignore alignment
382 we can't do with expected alignment of the stack boundary. */
384 static unsigned int
385 align_local_variable (tree decl)
387 unsigned int align;
389 if (TREE_CODE (decl) == SSA_NAME)
390 align = TYPE_ALIGN (TREE_TYPE (decl));
391 else
393 align = LOCAL_DECL_ALIGNMENT (decl);
394 DECL_ALIGN (decl) = align;
396 return align / BITS_PER_UNIT;
399 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
400 down otherwise. Return truncated BASE value. */
402 static inline unsigned HOST_WIDE_INT
403 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
405 return align_up ? (base + align - 1) & -align : base & -align;
408 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
409 Return the frame offset. */
411 static HOST_WIDE_INT
412 alloc_stack_frame_space (HOST_WIDE_INT size, unsigned HOST_WIDE_INT align)
414 HOST_WIDE_INT offset, new_frame_offset;
416 if (FRAME_GROWS_DOWNWARD)
418 new_frame_offset
419 = align_base (frame_offset - frame_phase - size,
420 align, false) + frame_phase;
421 offset = new_frame_offset;
423 else
425 new_frame_offset
426 = align_base (frame_offset - frame_phase, align, true) + frame_phase;
427 offset = new_frame_offset;
428 new_frame_offset += size;
430 frame_offset = new_frame_offset;
432 if (frame_offset_overflow (frame_offset, cfun->decl))
433 frame_offset = offset = 0;
435 return offset;
438 /* Accumulate DECL into STACK_VARS. */
440 static void
441 add_stack_var (tree decl)
443 struct stack_var *v;
445 if (stack_vars_num >= stack_vars_alloc)
447 if (stack_vars_alloc)
448 stack_vars_alloc = stack_vars_alloc * 3 / 2;
449 else
450 stack_vars_alloc = 32;
451 stack_vars
452 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
454 if (!decl_to_stack_part)
455 decl_to_stack_part = new hash_map<tree, size_t>;
457 v = &stack_vars[stack_vars_num];
458 decl_to_stack_part->put (decl, stack_vars_num);
460 v->decl = decl;
461 tree size = TREE_CODE (decl) == SSA_NAME
462 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
463 : DECL_SIZE_UNIT (decl);
464 v->size = tree_to_uhwi (size);
465 /* Ensure that all variables have size, so that &a != &b for any two
466 variables that are simultaneously live. */
467 if (v->size == 0)
468 v->size = 1;
469 v->alignb = align_local_variable (decl);
470 /* An alignment of zero can mightily confuse us later. */
471 gcc_assert (v->alignb != 0);
473 /* All variables are initially in their own partition. */
474 v->representative = stack_vars_num;
475 v->next = EOC;
477 /* All variables initially conflict with no other. */
478 v->conflicts = NULL;
480 /* Ensure that this decl doesn't get put onto the list twice. */
481 set_rtl (decl, pc_rtx);
483 stack_vars_num++;
486 /* Make the decls associated with luid's X and Y conflict. */
488 static void
489 add_stack_var_conflict (size_t x, size_t y)
491 struct stack_var *a = &stack_vars[x];
492 struct stack_var *b = &stack_vars[y];
493 if (!a->conflicts)
494 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
495 if (!b->conflicts)
496 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
497 bitmap_set_bit (a->conflicts, y);
498 bitmap_set_bit (b->conflicts, x);
501 /* Check whether the decls associated with luid's X and Y conflict. */
503 static bool
504 stack_var_conflict_p (size_t x, size_t y)
506 struct stack_var *a = &stack_vars[x];
507 struct stack_var *b = &stack_vars[y];
508 if (x == y)
509 return false;
510 /* Partitions containing an SSA name result from gimple registers
511 with things like unsupported modes. They are top-level and
512 hence conflict with everything else. */
513 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
514 return true;
516 if (!a->conflicts || !b->conflicts)
517 return false;
518 return bitmap_bit_p (a->conflicts, y);
521 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
522 enter its partition number into bitmap DATA. */
524 static bool
525 visit_op (gimple *, tree op, tree, void *data)
527 bitmap active = (bitmap)data;
528 op = get_base_address (op);
529 if (op
530 && DECL_P (op)
531 && DECL_RTL_IF_SET (op) == pc_rtx)
533 size_t *v = decl_to_stack_part->get (op);
534 if (v)
535 bitmap_set_bit (active, *v);
537 return false;
540 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
541 record conflicts between it and all currently active other partitions
542 from bitmap DATA. */
544 static bool
545 visit_conflict (gimple *, tree op, tree, void *data)
547 bitmap active = (bitmap)data;
548 op = get_base_address (op);
549 if (op
550 && DECL_P (op)
551 && DECL_RTL_IF_SET (op) == pc_rtx)
553 size_t *v = decl_to_stack_part->get (op);
554 if (v && bitmap_set_bit (active, *v))
556 size_t num = *v;
557 bitmap_iterator bi;
558 unsigned i;
559 gcc_assert (num < stack_vars_num);
560 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
561 add_stack_var_conflict (num, i);
564 return false;
567 /* Helper routine for add_scope_conflicts, calculating the active partitions
568 at the end of BB, leaving the result in WORK. We're called to generate
569 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
570 liveness. */
572 static void
573 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
575 edge e;
576 edge_iterator ei;
577 gimple_stmt_iterator gsi;
578 walk_stmt_load_store_addr_fn visit;
580 bitmap_clear (work);
581 FOR_EACH_EDGE (e, ei, bb->preds)
582 bitmap_ior_into (work, (bitmap)e->src->aux);
584 visit = visit_op;
586 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
588 gimple *stmt = gsi_stmt (gsi);
589 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
591 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
593 gimple *stmt = gsi_stmt (gsi);
595 if (gimple_clobber_p (stmt))
597 tree lhs = gimple_assign_lhs (stmt);
598 size_t *v;
599 /* Nested function lowering might introduce LHSs
600 that are COMPONENT_REFs. */
601 if (TREE_CODE (lhs) != VAR_DECL)
602 continue;
603 if (DECL_RTL_IF_SET (lhs) == pc_rtx
604 && (v = decl_to_stack_part->get (lhs)))
605 bitmap_clear_bit (work, *v);
607 else if (!is_gimple_debug (stmt))
609 if (for_conflict
610 && visit == visit_op)
612 /* If this is the first real instruction in this BB we need
613 to add conflicts for everything live at this point now.
614 Unlike classical liveness for named objects we can't
615 rely on seeing a def/use of the names we're interested in.
616 There might merely be indirect loads/stores. We'd not add any
617 conflicts for such partitions. */
618 bitmap_iterator bi;
619 unsigned i;
620 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
622 struct stack_var *a = &stack_vars[i];
623 if (!a->conflicts)
624 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
625 bitmap_ior_into (a->conflicts, work);
627 visit = visit_conflict;
629 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
634 /* Generate stack partition conflicts between all partitions that are
635 simultaneously live. */
637 static void
638 add_scope_conflicts (void)
640 basic_block bb;
641 bool changed;
642 bitmap work = BITMAP_ALLOC (NULL);
643 int *rpo;
644 int n_bbs;
646 /* We approximate the live range of a stack variable by taking the first
647 mention of its name as starting point(s), and by the end-of-scope
648 death clobber added by gimplify as ending point(s) of the range.
649 This overapproximates in the case we for instance moved an address-taken
650 operation upward, without also moving a dereference to it upwards.
651 But it's conservatively correct as a variable never can hold values
652 before its name is mentioned at least once.
654 We then do a mostly classical bitmap liveness algorithm. */
656 FOR_ALL_BB_FN (bb, cfun)
657 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
659 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
660 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
662 changed = true;
663 while (changed)
665 int i;
666 changed = false;
667 for (i = 0; i < n_bbs; i++)
669 bitmap active;
670 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
671 active = (bitmap)bb->aux;
672 add_scope_conflicts_1 (bb, work, false);
673 if (bitmap_ior_into (active, work))
674 changed = true;
678 FOR_EACH_BB_FN (bb, cfun)
679 add_scope_conflicts_1 (bb, work, true);
681 free (rpo);
682 BITMAP_FREE (work);
683 FOR_ALL_BB_FN (bb, cfun)
684 BITMAP_FREE (bb->aux);
687 /* A subroutine of partition_stack_vars. A comparison function for qsort,
688 sorting an array of indices by the properties of the object. */
690 static int
691 stack_var_cmp (const void *a, const void *b)
693 size_t ia = *(const size_t *)a;
694 size_t ib = *(const size_t *)b;
695 unsigned int aligna = stack_vars[ia].alignb;
696 unsigned int alignb = stack_vars[ib].alignb;
697 HOST_WIDE_INT sizea = stack_vars[ia].size;
698 HOST_WIDE_INT sizeb = stack_vars[ib].size;
699 tree decla = stack_vars[ia].decl;
700 tree declb = stack_vars[ib].decl;
701 bool largea, largeb;
702 unsigned int uida, uidb;
704 /* Primary compare on "large" alignment. Large comes first. */
705 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
706 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
707 if (largea != largeb)
708 return (int)largeb - (int)largea;
710 /* Secondary compare on size, decreasing */
711 if (sizea > sizeb)
712 return -1;
713 if (sizea < sizeb)
714 return 1;
716 /* Tertiary compare on true alignment, decreasing. */
717 if (aligna < alignb)
718 return -1;
719 if (aligna > alignb)
720 return 1;
722 /* Final compare on ID for sort stability, increasing.
723 Two SSA names are compared by their version, SSA names come before
724 non-SSA names, and two normal decls are compared by their DECL_UID. */
725 if (TREE_CODE (decla) == SSA_NAME)
727 if (TREE_CODE (declb) == SSA_NAME)
728 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
729 else
730 return -1;
732 else if (TREE_CODE (declb) == SSA_NAME)
733 return 1;
734 else
735 uida = DECL_UID (decla), uidb = DECL_UID (declb);
736 if (uida < uidb)
737 return 1;
738 if (uida > uidb)
739 return -1;
740 return 0;
743 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
744 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
746 /* If the points-to solution *PI points to variables that are in a partition
747 together with other variables add all partition members to the pointed-to
748 variables bitmap. */
750 static void
751 add_partitioned_vars_to_ptset (struct pt_solution *pt,
752 part_hashmap *decls_to_partitions,
753 hash_set<bitmap> *visited, bitmap temp)
755 bitmap_iterator bi;
756 unsigned i;
757 bitmap *part;
759 if (pt->anything
760 || pt->vars == NULL
761 /* The pointed-to vars bitmap is shared, it is enough to
762 visit it once. */
763 || visited->add (pt->vars))
764 return;
766 bitmap_clear (temp);
768 /* By using a temporary bitmap to store all members of the partitions
769 we have to add we make sure to visit each of the partitions only
770 once. */
771 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
772 if ((!temp
773 || !bitmap_bit_p (temp, i))
774 && (part = decls_to_partitions->get (i)))
775 bitmap_ior_into (temp, *part);
776 if (!bitmap_empty_p (temp))
777 bitmap_ior_into (pt->vars, temp);
780 /* Update points-to sets based on partition info, so we can use them on RTL.
781 The bitmaps representing stack partitions will be saved until expand,
782 where partitioned decls used as bases in memory expressions will be
783 rewritten. */
785 static void
786 update_alias_info_with_stack_vars (void)
788 part_hashmap *decls_to_partitions = NULL;
789 size_t i, j;
790 tree var = NULL_TREE;
792 for (i = 0; i < stack_vars_num; i++)
794 bitmap part = NULL;
795 tree name;
796 struct ptr_info_def *pi;
798 /* Not interested in partitions with single variable. */
799 if (stack_vars[i].representative != i
800 || stack_vars[i].next == EOC)
801 continue;
803 if (!decls_to_partitions)
805 decls_to_partitions = new part_hashmap;
806 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
809 /* Create an SSA_NAME that points to the partition for use
810 as base during alias-oracle queries on RTL for bases that
811 have been partitioned. */
812 if (var == NULL_TREE)
813 var = create_tmp_var (ptr_type_node);
814 name = make_ssa_name (var);
816 /* Create bitmaps representing partitions. They will be used for
817 points-to sets later, so use GGC alloc. */
818 part = BITMAP_GGC_ALLOC ();
819 for (j = i; j != EOC; j = stack_vars[j].next)
821 tree decl = stack_vars[j].decl;
822 unsigned int uid = DECL_PT_UID (decl);
823 bitmap_set_bit (part, uid);
824 decls_to_partitions->put (uid, part);
825 cfun->gimple_df->decls_to_pointers->put (decl, name);
826 if (TREE_ADDRESSABLE (decl))
827 TREE_ADDRESSABLE (name) = 1;
830 /* Make the SSA name point to all partition members. */
831 pi = get_ptr_info (name);
832 pt_solution_set (&pi->pt, part, false);
835 /* Make all points-to sets that contain one member of a partition
836 contain all members of the partition. */
837 if (decls_to_partitions)
839 unsigned i;
840 hash_set<bitmap> visited;
841 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
843 for (i = 1; i < num_ssa_names; i++)
845 tree name = ssa_name (i);
846 struct ptr_info_def *pi;
848 if (name
849 && POINTER_TYPE_P (TREE_TYPE (name))
850 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
851 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
852 &visited, temp);
855 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
856 decls_to_partitions, &visited, temp);
858 delete decls_to_partitions;
859 BITMAP_FREE (temp);
863 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
864 partitioning algorithm. Partitions A and B are known to be non-conflicting.
865 Merge them into a single partition A. */
867 static void
868 union_stack_vars (size_t a, size_t b)
870 struct stack_var *vb = &stack_vars[b];
871 bitmap_iterator bi;
872 unsigned u;
874 gcc_assert (stack_vars[b].next == EOC);
875 /* Add B to A's partition. */
876 stack_vars[b].next = stack_vars[a].next;
877 stack_vars[b].representative = a;
878 stack_vars[a].next = b;
880 /* Update the required alignment of partition A to account for B. */
881 if (stack_vars[a].alignb < stack_vars[b].alignb)
882 stack_vars[a].alignb = stack_vars[b].alignb;
884 /* Update the interference graph and merge the conflicts. */
885 if (vb->conflicts)
887 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
888 add_stack_var_conflict (a, stack_vars[u].representative);
889 BITMAP_FREE (vb->conflicts);
893 /* A subroutine of expand_used_vars. Binpack the variables into
894 partitions constrained by the interference graph. The overall
895 algorithm used is as follows:
897 Sort the objects by size in descending order.
898 For each object A {
899 S = size(A)
900 O = 0
901 loop {
902 Look for the largest non-conflicting object B with size <= S.
903 UNION (A, B)
908 static void
909 partition_stack_vars (void)
911 size_t si, sj, n = stack_vars_num;
913 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
914 for (si = 0; si < n; ++si)
915 stack_vars_sorted[si] = si;
917 if (n == 1)
918 return;
920 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
922 for (si = 0; si < n; ++si)
924 size_t i = stack_vars_sorted[si];
925 unsigned int ialign = stack_vars[i].alignb;
926 HOST_WIDE_INT isize = stack_vars[i].size;
928 /* Ignore objects that aren't partition representatives. If we
929 see a var that is not a partition representative, it must
930 have been merged earlier. */
931 if (stack_vars[i].representative != i)
932 continue;
934 for (sj = si + 1; sj < n; ++sj)
936 size_t j = stack_vars_sorted[sj];
937 unsigned int jalign = stack_vars[j].alignb;
938 HOST_WIDE_INT jsize = stack_vars[j].size;
940 /* Ignore objects that aren't partition representatives. */
941 if (stack_vars[j].representative != j)
942 continue;
944 /* Do not mix objects of "small" (supported) alignment
945 and "large" (unsupported) alignment. */
946 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
947 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
948 break;
950 /* For Address Sanitizer do not mix objects with different
951 sizes, as the shorter vars wouldn't be adequately protected.
952 Don't do that for "large" (unsupported) alignment objects,
953 those aren't protected anyway. */
954 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK && isize != jsize
955 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
956 break;
958 /* Ignore conflicting objects. */
959 if (stack_var_conflict_p (i, j))
960 continue;
962 /* UNION the objects, placing J at OFFSET. */
963 union_stack_vars (i, j);
967 update_alias_info_with_stack_vars ();
970 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
972 static void
973 dump_stack_var_partition (void)
975 size_t si, i, j, n = stack_vars_num;
977 for (si = 0; si < n; ++si)
979 i = stack_vars_sorted[si];
981 /* Skip variables that aren't partition representatives, for now. */
982 if (stack_vars[i].representative != i)
983 continue;
985 fprintf (dump_file, "Partition %lu: size " HOST_WIDE_INT_PRINT_DEC
986 " align %u\n", (unsigned long) i, stack_vars[i].size,
987 stack_vars[i].alignb);
989 for (j = i; j != EOC; j = stack_vars[j].next)
991 fputc ('\t', dump_file);
992 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
994 fputc ('\n', dump_file);
998 /* Assign rtl to DECL at BASE + OFFSET. */
1000 static void
1001 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
1002 HOST_WIDE_INT offset)
1004 unsigned align;
1005 rtx x;
1007 /* If this fails, we've overflowed the stack frame. Error nicely? */
1008 gcc_assert (offset == trunc_int_for_mode (offset, Pmode));
1010 x = plus_constant (Pmode, base, offset);
1011 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1012 ? TYPE_MODE (TREE_TYPE (decl))
1013 : DECL_MODE (SSAVAR (decl)), x);
1015 if (TREE_CODE (decl) != SSA_NAME)
1017 /* Set alignment we actually gave this decl if it isn't an SSA name.
1018 If it is we generate stack slots only accidentally so it isn't as
1019 important, we'll simply use the alignment that is already set. */
1020 if (base == virtual_stack_vars_rtx)
1021 offset -= frame_phase;
1022 align = offset & -offset;
1023 align *= BITS_PER_UNIT;
1024 if (align == 0 || align > base_align)
1025 align = base_align;
1027 /* One would think that we could assert that we're not decreasing
1028 alignment here, but (at least) the i386 port does exactly this
1029 via the MINIMUM_ALIGNMENT hook. */
1031 DECL_ALIGN (decl) = align;
1032 DECL_USER_ALIGN (decl) = 0;
1035 set_rtl (decl, x);
1038 struct stack_vars_data
1040 /* Vector of offset pairs, always end of some padding followed
1041 by start of the padding that needs Address Sanitizer protection.
1042 The vector is in reversed, highest offset pairs come first. */
1043 vec<HOST_WIDE_INT> asan_vec;
1045 /* Vector of partition representative decls in between the paddings. */
1046 vec<tree> asan_decl_vec;
1048 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1049 rtx asan_base;
1051 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1052 unsigned int asan_alignb;
1055 /* A subroutine of expand_used_vars. Give each partition representative
1056 a unique location within the stack frame. Update each partition member
1057 with that location. */
1059 static void
1060 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1062 size_t si, i, j, n = stack_vars_num;
1063 HOST_WIDE_INT large_size = 0, large_alloc = 0;
1064 rtx large_base = NULL;
1065 unsigned large_align = 0;
1066 tree decl;
1068 /* Determine if there are any variables requiring "large" alignment.
1069 Since these are dynamically allocated, we only process these if
1070 no predicate involved. */
1071 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1072 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1074 /* Find the total size of these variables. */
1075 for (si = 0; si < n; ++si)
1077 unsigned alignb;
1079 i = stack_vars_sorted[si];
1080 alignb = stack_vars[i].alignb;
1082 /* All "large" alignment decls come before all "small" alignment
1083 decls, but "large" alignment decls are not sorted based on
1084 their alignment. Increase large_align to track the largest
1085 required alignment. */
1086 if ((alignb * BITS_PER_UNIT) > large_align)
1087 large_align = alignb * BITS_PER_UNIT;
1089 /* Stop when we get to the first decl with "small" alignment. */
1090 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1091 break;
1093 /* Skip variables that aren't partition representatives. */
1094 if (stack_vars[i].representative != i)
1095 continue;
1097 /* Skip variables that have already had rtl assigned. See also
1098 add_stack_var where we perpetrate this pc_rtx hack. */
1099 decl = stack_vars[i].decl;
1100 if (TREE_CODE (decl) == SSA_NAME
1101 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1102 : DECL_RTL (decl) != pc_rtx)
1103 continue;
1105 large_size += alignb - 1;
1106 large_size &= -(HOST_WIDE_INT)alignb;
1107 large_size += stack_vars[i].size;
1110 /* If there were any, allocate space. */
1111 if (large_size > 0)
1112 large_base = allocate_dynamic_stack_space (GEN_INT (large_size), 0,
1113 large_align, true);
1116 for (si = 0; si < n; ++si)
1118 rtx base;
1119 unsigned base_align, alignb;
1120 HOST_WIDE_INT offset;
1122 i = stack_vars_sorted[si];
1124 /* Skip variables that aren't partition representatives, for now. */
1125 if (stack_vars[i].representative != i)
1126 continue;
1128 /* Skip variables that have already had rtl assigned. See also
1129 add_stack_var where we perpetrate this pc_rtx hack. */
1130 decl = stack_vars[i].decl;
1131 if (TREE_CODE (decl) == SSA_NAME
1132 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1133 : DECL_RTL (decl) != pc_rtx)
1134 continue;
1136 /* Check the predicate to see whether this variable should be
1137 allocated in this pass. */
1138 if (pred && !pred (i))
1139 continue;
1141 alignb = stack_vars[i].alignb;
1142 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1144 base = virtual_stack_vars_rtx;
1145 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK && pred)
1147 HOST_WIDE_INT prev_offset
1148 = align_base (frame_offset,
1149 MAX (alignb, ASAN_RED_ZONE_SIZE),
1150 FRAME_GROWS_DOWNWARD);
1151 tree repr_decl = NULL_TREE;
1152 offset
1153 = alloc_stack_frame_space (stack_vars[i].size
1154 + ASAN_RED_ZONE_SIZE,
1155 MAX (alignb, ASAN_RED_ZONE_SIZE));
1157 data->asan_vec.safe_push (prev_offset);
1158 data->asan_vec.safe_push (offset + stack_vars[i].size);
1159 /* Find best representative of the partition.
1160 Prefer those with DECL_NAME, even better
1161 satisfying asan_protect_stack_decl predicate. */
1162 for (j = i; j != EOC; j = stack_vars[j].next)
1163 if (asan_protect_stack_decl (stack_vars[j].decl)
1164 && DECL_NAME (stack_vars[j].decl))
1166 repr_decl = stack_vars[j].decl;
1167 break;
1169 else if (repr_decl == NULL_TREE
1170 && DECL_P (stack_vars[j].decl)
1171 && DECL_NAME (stack_vars[j].decl))
1172 repr_decl = stack_vars[j].decl;
1173 if (repr_decl == NULL_TREE)
1174 repr_decl = stack_vars[i].decl;
1175 data->asan_decl_vec.safe_push (repr_decl);
1176 data->asan_alignb = MAX (data->asan_alignb, alignb);
1177 if (data->asan_base == NULL)
1178 data->asan_base = gen_reg_rtx (Pmode);
1179 base = data->asan_base;
1181 if (!STRICT_ALIGNMENT)
1182 base_align = crtl->max_used_stack_slot_alignment;
1183 else
1184 base_align = MAX (crtl->max_used_stack_slot_alignment,
1185 GET_MODE_ALIGNMENT (SImode)
1186 << ASAN_SHADOW_SHIFT);
1188 else
1190 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1191 base_align = crtl->max_used_stack_slot_alignment;
1194 else
1196 /* Large alignment is only processed in the last pass. */
1197 if (pred)
1198 continue;
1199 gcc_assert (large_base != NULL);
1201 large_alloc += alignb - 1;
1202 large_alloc &= -(HOST_WIDE_INT)alignb;
1203 offset = large_alloc;
1204 large_alloc += stack_vars[i].size;
1206 base = large_base;
1207 base_align = large_align;
1210 /* Create rtl for each variable based on their location within the
1211 partition. */
1212 for (j = i; j != EOC; j = stack_vars[j].next)
1214 expand_one_stack_var_at (stack_vars[j].decl,
1215 base, base_align,
1216 offset);
1220 gcc_assert (large_alloc == large_size);
1223 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1224 static HOST_WIDE_INT
1225 account_stack_vars (void)
1227 size_t si, j, i, n = stack_vars_num;
1228 HOST_WIDE_INT size = 0;
1230 for (si = 0; si < n; ++si)
1232 i = stack_vars_sorted[si];
1234 /* Skip variables that aren't partition representatives, for now. */
1235 if (stack_vars[i].representative != i)
1236 continue;
1238 size += stack_vars[i].size;
1239 for (j = i; j != EOC; j = stack_vars[j].next)
1240 set_rtl (stack_vars[j].decl, NULL);
1242 return size;
1245 /* A subroutine of expand_one_var. Called to immediately assign rtl
1246 to a variable to be allocated in the stack frame. */
1248 static void
1249 expand_one_stack_var_1 (tree var)
1251 HOST_WIDE_INT size, offset;
1252 unsigned byte_align;
1254 if (TREE_CODE (var) == SSA_NAME)
1256 tree type = TREE_TYPE (var);
1257 size = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1258 byte_align = TYPE_ALIGN_UNIT (type);
1260 else
1262 size = tree_to_uhwi (DECL_SIZE_UNIT (var));
1263 byte_align = align_local_variable (var);
1266 /* We handle highly aligned variables in expand_stack_vars. */
1267 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1269 offset = alloc_stack_frame_space (size, byte_align);
1271 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1272 crtl->max_used_stack_slot_alignment, offset);
1275 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1276 already assigned some MEM. */
1278 static void
1279 expand_one_stack_var (tree var)
1281 if (TREE_CODE (var) == SSA_NAME)
1283 int part = var_to_partition (SA.map, var);
1284 if (part != NO_PARTITION)
1286 rtx x = SA.partition_to_pseudo[part];
1287 gcc_assert (x);
1288 gcc_assert (MEM_P (x));
1289 return;
1293 return expand_one_stack_var_1 (var);
1296 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1297 that will reside in a hard register. */
1299 static void
1300 expand_one_hard_reg_var (tree var)
1302 rest_of_decl_compilation (var, 0, 0);
1305 /* Record the alignment requirements of some variable assigned to a
1306 pseudo. */
1308 static void
1309 record_alignment_for_reg_var (unsigned int align)
1311 if (SUPPORTS_STACK_ALIGNMENT
1312 && crtl->stack_alignment_estimated < align)
1314 /* stack_alignment_estimated shouldn't change after stack
1315 realign decision made */
1316 gcc_assert (!crtl->stack_realign_processed);
1317 crtl->stack_alignment_estimated = align;
1320 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1321 So here we only make sure stack_alignment_needed >= align. */
1322 if (crtl->stack_alignment_needed < align)
1323 crtl->stack_alignment_needed = align;
1324 if (crtl->max_used_stack_slot_alignment < align)
1325 crtl->max_used_stack_slot_alignment = align;
1328 /* Create RTL for an SSA partition. */
1330 static void
1331 expand_one_ssa_partition (tree var)
1333 int part = var_to_partition (SA.map, var);
1334 gcc_assert (part != NO_PARTITION);
1336 if (SA.partition_to_pseudo[part])
1337 return;
1339 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1340 TYPE_MODE (TREE_TYPE (var)),
1341 TYPE_ALIGN (TREE_TYPE (var)));
1343 /* If the variable alignment is very large we'll dynamicaly allocate
1344 it, which means that in-frame portion is just a pointer. */
1345 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1346 align = POINTER_SIZE;
1348 record_alignment_for_reg_var (align);
1350 if (!use_register_for_decl (var))
1352 /* We can't risk having the parm assigned to a MEM location
1353 whose address references a pseudo, for the pseudo will only
1354 be set up after arguments are copied to the stack slot.
1356 If the parm doesn't have a default def (e.g., because its
1357 incoming value is unused), then we want to let assign_params
1358 do the allocation, too. In this case we want to make sure
1359 SSA_NAMEs associated with the parm don't get assigned to more
1360 than one partition, lest we'd create two unassigned stac
1361 slots for the same parm, thus the assert at the end of the
1362 block. */
1363 if (parm_in_stack_slot_p (SSA_NAME_VAR (var))
1364 && (ssa_default_def_partition (SSA_NAME_VAR (var)) == part
1365 || !ssa_default_def (cfun, SSA_NAME_VAR (var))))
1367 expand_one_stack_var_at (var, pc_rtx, 0, 0);
1368 rtx x = SA.partition_to_pseudo[part];
1369 gcc_assert (GET_CODE (x) == MEM);
1370 gcc_assert (XEXP (x, 0) == pc_rtx);
1371 /* Reset the address, so that any attempt to use it will
1372 ICE. It will be adjusted in assign_parm_setup_reg. */
1373 XEXP (x, 0) = NULL_RTX;
1374 /* If the RTL associated with the parm is not what we have
1375 just created, the parm has been split over multiple
1376 partitions. In order for this to work, we must have a
1377 default def for the parm, otherwise assign_params won't
1378 know what to do. */
1379 gcc_assert (DECL_RTL_IF_SET (SSA_NAME_VAR (var)) == x
1380 || ssa_default_def (cfun, SSA_NAME_VAR (var)));
1382 else if (defer_stack_allocation (var, true))
1383 add_stack_var (var);
1384 else
1385 expand_one_stack_var_1 (var);
1386 return;
1389 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1391 rtx x = gen_reg_rtx (reg_mode);
1393 set_rtl (var, x);
1396 /* Record the association between the RTL generated for a partition
1397 and the underlying variable of the SSA_NAME. */
1399 static void
1400 adjust_one_expanded_partition_var (tree var)
1402 if (!var)
1403 return;
1405 tree decl = SSA_NAME_VAR (var);
1407 int part = var_to_partition (SA.map, var);
1408 if (part == NO_PARTITION)
1409 return;
1411 rtx x = SA.partition_to_pseudo[part];
1413 if (!x)
1415 /* This var will get a stack slot later. */
1416 gcc_assert (defer_stack_allocation (var, true));
1417 return;
1420 set_rtl (var, x);
1422 if (!REG_P (x))
1423 return;
1425 /* Note if the object is a user variable. */
1426 if (decl && !DECL_ARTIFICIAL (decl))
1427 mark_user_reg (x);
1429 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1430 mark_reg_pointer (x, get_pointer_alignment (var));
1433 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1434 that will reside in a pseudo register. */
1436 static void
1437 expand_one_register_var (tree var)
1439 if (TREE_CODE (var) == SSA_NAME)
1441 int part = var_to_partition (SA.map, var);
1442 if (part != NO_PARTITION)
1444 rtx x = SA.partition_to_pseudo[part];
1445 gcc_assert (x);
1446 gcc_assert (REG_P (x));
1447 return;
1449 gcc_unreachable ();
1452 tree decl = var;
1453 tree type = TREE_TYPE (decl);
1454 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1455 rtx x = gen_reg_rtx (reg_mode);
1457 set_rtl (var, x);
1459 /* Note if the object is a user variable. */
1460 if (!DECL_ARTIFICIAL (decl))
1461 mark_user_reg (x);
1463 if (POINTER_TYPE_P (type))
1464 mark_reg_pointer (x, get_pointer_alignment (var));
1467 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1468 has some associated error, e.g. its type is error-mark. We just need
1469 to pick something that won't crash the rest of the compiler. */
1471 static void
1472 expand_one_error_var (tree var)
1474 machine_mode mode = DECL_MODE (var);
1475 rtx x;
1477 if (mode == BLKmode)
1478 x = gen_rtx_MEM (BLKmode, const0_rtx);
1479 else if (mode == VOIDmode)
1480 x = const0_rtx;
1481 else
1482 x = gen_reg_rtx (mode);
1484 SET_DECL_RTL (var, x);
1487 /* A subroutine of expand_one_var. VAR is a variable that will be
1488 allocated to the local stack frame. Return true if we wish to
1489 add VAR to STACK_VARS so that it will be coalesced with other
1490 variables. Return false to allocate VAR immediately.
1492 This function is used to reduce the number of variables considered
1493 for coalescing, which reduces the size of the quadratic problem. */
1495 static bool
1496 defer_stack_allocation (tree var, bool toplevel)
1498 tree size_unit = TREE_CODE (var) == SSA_NAME
1499 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1500 : DECL_SIZE_UNIT (var);
1502 /* Whether the variable is small enough for immediate allocation not to be
1503 a problem with regard to the frame size. */
1504 bool smallish
1505 = ((HOST_WIDE_INT) tree_to_uhwi (size_unit)
1506 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING));
1508 /* If stack protection is enabled, *all* stack variables must be deferred,
1509 so that we can re-order the strings to the top of the frame.
1510 Similarly for Address Sanitizer. */
1511 if (flag_stack_protect || ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK))
1512 return true;
1514 unsigned int align = TREE_CODE (var) == SSA_NAME
1515 ? TYPE_ALIGN (TREE_TYPE (var))
1516 : DECL_ALIGN (var);
1518 /* We handle "large" alignment via dynamic allocation. We want to handle
1519 this extra complication in only one place, so defer them. */
1520 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1521 return true;
1523 bool ignored = TREE_CODE (var) == SSA_NAME
1524 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1525 : DECL_IGNORED_P (var);
1527 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1528 might be detached from their block and appear at toplevel when we reach
1529 here. We want to coalesce them with variables from other blocks when
1530 the immediate contribution to the frame size would be noticeable. */
1531 if (toplevel && optimize > 0 && ignored && !smallish)
1532 return true;
1534 /* Variables declared in the outermost scope automatically conflict
1535 with every other variable. The only reason to want to defer them
1536 at all is that, after sorting, we can more efficiently pack
1537 small variables in the stack frame. Continue to defer at -O2. */
1538 if (toplevel && optimize < 2)
1539 return false;
1541 /* Without optimization, *most* variables are allocated from the
1542 stack, which makes the quadratic problem large exactly when we
1543 want compilation to proceed as quickly as possible. On the
1544 other hand, we don't want the function's stack frame size to
1545 get completely out of hand. So we avoid adding scalars and
1546 "small" aggregates to the list at all. */
1547 if (optimize == 0 && smallish)
1548 return false;
1550 return true;
1553 /* A subroutine of expand_used_vars. Expand one variable according to
1554 its flavor. Variables to be placed on the stack are not actually
1555 expanded yet, merely recorded.
1556 When REALLY_EXPAND is false, only add stack values to be allocated.
1557 Return stack usage this variable is supposed to take.
1560 static HOST_WIDE_INT
1561 expand_one_var (tree var, bool toplevel, bool really_expand)
1563 unsigned int align = BITS_PER_UNIT;
1564 tree origvar = var;
1566 var = SSAVAR (var);
1568 if (TREE_TYPE (var) != error_mark_node && TREE_CODE (var) == VAR_DECL)
1570 /* Because we don't know if VAR will be in register or on stack,
1571 we conservatively assume it will be on stack even if VAR is
1572 eventually put into register after RA pass. For non-automatic
1573 variables, which won't be on stack, we collect alignment of
1574 type and ignore user specified alignment. Similarly for
1575 SSA_NAMEs for which use_register_for_decl returns true. */
1576 if (TREE_STATIC (var)
1577 || DECL_EXTERNAL (var)
1578 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1579 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1580 TYPE_MODE (TREE_TYPE (var)),
1581 TYPE_ALIGN (TREE_TYPE (var)));
1582 else if (DECL_HAS_VALUE_EXPR_P (var)
1583 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1584 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1585 or variables which were assigned a stack slot already by
1586 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1587 changed from the offset chosen to it. */
1588 align = crtl->stack_alignment_estimated;
1589 else
1590 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1592 /* If the variable alignment is very large we'll dynamicaly allocate
1593 it, which means that in-frame portion is just a pointer. */
1594 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1595 align = POINTER_SIZE;
1598 record_alignment_for_reg_var (align);
1600 if (TREE_CODE (origvar) == SSA_NAME)
1602 gcc_assert (TREE_CODE (var) != VAR_DECL
1603 || (!DECL_EXTERNAL (var)
1604 && !DECL_HAS_VALUE_EXPR_P (var)
1605 && !TREE_STATIC (var)
1606 && TREE_TYPE (var) != error_mark_node
1607 && !DECL_HARD_REGISTER (var)
1608 && really_expand));
1610 if (TREE_CODE (var) != VAR_DECL && TREE_CODE (origvar) != SSA_NAME)
1612 else if (DECL_EXTERNAL (var))
1614 else if (DECL_HAS_VALUE_EXPR_P (var))
1616 else if (TREE_STATIC (var))
1618 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1620 else if (TREE_TYPE (var) == error_mark_node)
1622 if (really_expand)
1623 expand_one_error_var (var);
1625 else if (TREE_CODE (var) == VAR_DECL && DECL_HARD_REGISTER (var))
1627 if (really_expand)
1629 expand_one_hard_reg_var (var);
1630 if (!DECL_HARD_REGISTER (var))
1631 /* Invalid register specification. */
1632 expand_one_error_var (var);
1635 else if (use_register_for_decl (var))
1637 if (really_expand)
1638 expand_one_register_var (origvar);
1640 else if (! valid_constant_size_p (DECL_SIZE_UNIT (var)))
1642 /* Reject variables which cover more than half of the address-space. */
1643 if (really_expand)
1645 error ("size of variable %q+D is too large", var);
1646 expand_one_error_var (var);
1649 else if (defer_stack_allocation (var, toplevel))
1650 add_stack_var (origvar);
1651 else
1653 if (really_expand)
1655 if (lookup_attribute ("naked",
1656 DECL_ATTRIBUTES (current_function_decl)))
1657 error ("cannot allocate stack for variable %q+D, naked function.",
1658 var);
1660 expand_one_stack_var (origvar);
1664 return tree_to_uhwi (DECL_SIZE_UNIT (var));
1666 return 0;
1669 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1670 expanding variables. Those variables that can be put into registers
1671 are allocated pseudos; those that can't are put on the stack.
1673 TOPLEVEL is true if this is the outermost BLOCK. */
1675 static void
1676 expand_used_vars_for_block (tree block, bool toplevel)
1678 tree t;
1680 /* Expand all variables at this level. */
1681 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1682 if (TREE_USED (t)
1683 && ((TREE_CODE (t) != VAR_DECL && TREE_CODE (t) != RESULT_DECL)
1684 || !DECL_NONSHAREABLE (t)))
1685 expand_one_var (t, toplevel, true);
1687 /* Expand all variables at containing levels. */
1688 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1689 expand_used_vars_for_block (t, false);
1692 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1693 and clear TREE_USED on all local variables. */
1695 static void
1696 clear_tree_used (tree block)
1698 tree t;
1700 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1701 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1702 if ((TREE_CODE (t) != VAR_DECL && TREE_CODE (t) != RESULT_DECL)
1703 || !DECL_NONSHAREABLE (t))
1704 TREE_USED (t) = 0;
1706 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1707 clear_tree_used (t);
/* Values that flag_stack_protect is compared against in this file.  */
enum {
  /* A guard is created if the function calls alloca, has protected
     decls, or carries the "stack_protect" attribute.  */
  SPCT_FLAG_DEFAULT = 1,
  /* A guard is always created.  */
  SPCT_FLAG_ALL = 2,
  /* As SPCT_FLAG_DEFAULT, and additionally when the function has array
     or address-taken locals or calls that use a return slot.  */
  SPCT_FLAG_STRONG = 3,
  /* A guard is created only for functions carrying the "stack_protect"
     attribute.  */
  SPCT_FLAG_EXPLICIT = 4
};
1717 /* Examine TYPE and determine a bit mask of the following features. */
1719 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1720 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1721 #define SPCT_HAS_ARRAY 4
1722 #define SPCT_HAS_AGGREGATE 8
1724 static unsigned int
1725 stack_protect_classify_type (tree type)
1727 unsigned int ret = 0;
1728 tree t;
1730 switch (TREE_CODE (type))
1732 case ARRAY_TYPE:
1733 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1734 if (t == char_type_node
1735 || t == signed_char_type_node
1736 || t == unsigned_char_type_node)
1738 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1739 unsigned HOST_WIDE_INT len;
1741 if (!TYPE_SIZE_UNIT (type)
1742 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1743 len = max;
1744 else
1745 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1747 if (len < max)
1748 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1749 else
1750 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1752 else
1753 ret = SPCT_HAS_ARRAY;
1754 break;
1756 case UNION_TYPE:
1757 case QUAL_UNION_TYPE:
1758 case RECORD_TYPE:
1759 ret = SPCT_HAS_AGGREGATE;
1760 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1761 if (TREE_CODE (t) == FIELD_DECL)
1762 ret |= stack_protect_classify_type (TREE_TYPE (t));
1763 break;
1765 default:
1766 break;
1769 return ret;
1772 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1773 part of the local stack frame. Remember if we ever return nonzero for
1774 any variable in this function. The return value is the phase number in
1775 which the variable should be allocated. */
1777 static int
1778 stack_protect_decl_phase (tree decl)
1780 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1781 int ret = 0;
1783 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1784 has_short_buffer = true;
1786 if (flag_stack_protect == SPCT_FLAG_ALL
1787 || flag_stack_protect == SPCT_FLAG_STRONG
1788 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1789 && lookup_attribute ("stack_protect",
1790 DECL_ATTRIBUTES (current_function_decl))))
1792 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1793 && !(bits & SPCT_HAS_AGGREGATE))
1794 ret = 1;
1795 else if (bits & SPCT_HAS_ARRAY)
1796 ret = 2;
1798 else
1799 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1801 if (ret)
1802 has_protected_decls = true;
1804 return ret;
1807 /* Two helper routines that check for phase 1 and phase 2. These are used
1808 as callbacks for expand_stack_vars. */
1810 static bool
1811 stack_protect_decl_phase_1 (size_t i)
1813 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1816 static bool
1817 stack_protect_decl_phase_2 (size_t i)
1819 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1822 /* And helper function that checks for asan phase (with stack protector
1823 it is phase 3). This is used as callback for expand_stack_vars.
1824 Returns true if any of the vars in the partition need to be protected. */
1826 static bool
1827 asan_decl_phase_3 (size_t i)
1829 while (i != EOC)
1831 if (asan_protect_stack_decl (stack_vars[i].decl))
1832 return true;
1833 i = stack_vars[i].next;
1835 return false;
1838 /* Ensure that variables in different stack protection phases conflict
1839 so that they are not merged and share the same stack slot. */
1841 static void
1842 add_stack_protection_conflicts (void)
1844 size_t i, j, n = stack_vars_num;
1845 unsigned char *phase;
1847 phase = XNEWVEC (unsigned char, n);
1848 for (i = 0; i < n; ++i)
1849 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1851 for (i = 0; i < n; ++i)
1853 unsigned char ph_i = phase[i];
1854 for (j = i + 1; j < n; ++j)
1855 if (ph_i != phase[j])
1856 add_stack_var_conflict (i, j);
1859 XDELETEVEC (phase);
1862 /* Create a decl for the guard at the top of the stack frame. */
1864 static void
1865 create_stack_guard (void)
1867 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1868 VAR_DECL, NULL, ptr_type_node);
1869 TREE_THIS_VOLATILE (guard) = 1;
1870 TREE_USED (guard) = 1;
1871 expand_one_stack_var (guard);
1872 crtl->stack_protect_guard = guard;
1875 /* Prepare for expanding variables. */
1876 static void
1877 init_vars_expansion (void)
1879 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1880 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1882 /* A map from decl to stack partition. */
1883 decl_to_stack_part = new hash_map<tree, size_t>;
1885 /* Initialize local stack smashing state. */
1886 has_protected_decls = false;
1887 has_short_buffer = false;
1890 /* Free up stack variable graph data. */
1891 static void
1892 fini_vars_expansion (void)
1894 bitmap_obstack_release (&stack_var_bitmap_obstack);
1895 if (stack_vars)
1896 XDELETEVEC (stack_vars);
1897 if (stack_vars_sorted)
1898 XDELETEVEC (stack_vars_sorted);
1899 stack_vars = NULL;
1900 stack_vars_sorted = NULL;
1901 stack_vars_alloc = stack_vars_num = 0;
1902 delete decl_to_stack_part;
1903 decl_to_stack_part = NULL;
1906 /* Make a fair guess for the size of the stack frame of the function
1907 in NODE. This doesn't have to be exact, the result is only used in
1908 the inline heuristics. So we don't want to run the full stack var
1909 packing algorithm (which is quadratic in the number of stack vars).
1910 Instead, we calculate the total size of all stack vars. This turns
1911 out to be a pretty fair estimate -- packing of stack vars doesn't
1912 happen very often. */
1914 HOST_WIDE_INT
1915 estimated_stack_frame_size (struct cgraph_node *node)
1917 HOST_WIDE_INT size = 0;
1918 size_t i;
1919 tree var;
1920 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1922 push_cfun (fn);
1924 init_vars_expansion ();
1926 FOR_EACH_LOCAL_DECL (fn, i, var)
1927 if (auto_var_in_fn_p (var, fn->decl))
1928 size += expand_one_var (var, true, false);
1930 if (stack_vars_num > 0)
1932 /* Fake sorting the stack vars for account_stack_vars (). */
1933 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1934 for (i = 0; i < stack_vars_num; ++i)
1935 stack_vars_sorted[i] = i;
1936 size += account_stack_vars ();
1939 fini_vars_expansion ();
1940 pop_cfun ();
1941 return size;
1944 /* Helper routine to check if a record or union contains an array field. */
1946 static int
1947 record_or_union_type_has_array_p (const_tree tree_type)
1949 tree fields = TYPE_FIELDS (tree_type);
1950 tree f;
1952 for (f = fields; f; f = DECL_CHAIN (f))
1953 if (TREE_CODE (f) == FIELD_DECL)
1955 tree field_type = TREE_TYPE (f);
1956 if (RECORD_OR_UNION_TYPE_P (field_type)
1957 && record_or_union_type_has_array_p (field_type))
1958 return 1;
1959 if (TREE_CODE (field_type) == ARRAY_TYPE)
1960 return 1;
1962 return 0;
1965 /* Check if the current function has local referenced variables that
1966 have their addresses taken, contain an array, or are arrays. */
1968 static bool
1969 stack_protect_decl_p ()
1971 unsigned i;
1972 tree var;
1974 FOR_EACH_LOCAL_DECL (cfun, i, var)
1975 if (!is_global_var (var))
1977 tree var_type = TREE_TYPE (var);
1978 if (TREE_CODE (var) == VAR_DECL
1979 && (TREE_CODE (var_type) == ARRAY_TYPE
1980 || TREE_ADDRESSABLE (var)
1981 || (RECORD_OR_UNION_TYPE_P (var_type)
1982 && record_or_union_type_has_array_p (var_type))))
1983 return true;
1985 return false;
1988 /* Check if the current function has calls that use a return slot. */
1990 static bool
1991 stack_protect_return_slot_p ()
1993 basic_block bb;
1995 FOR_ALL_BB_FN (bb, cfun)
1996 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1997 !gsi_end_p (gsi); gsi_next (&gsi))
1999 gimple *stmt = gsi_stmt (gsi);
2000 /* This assumes that calls to internal-only functions never
2001 use a return slot. */
2002 if (is_gimple_call (stmt)
2003 && !gimple_call_internal_p (stmt)
2004 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2005 gimple_call_fndecl (stmt)))
2006 return true;
2008 return false;
2011 /* Expand all variables used in the function. */
2013 static rtx_insn *
2014 expand_used_vars (void)
2016 tree var, outer_block = DECL_INITIAL (current_function_decl);
2017 vec<tree> maybe_local_decls = vNULL;
2018 rtx_insn *var_end_seq = NULL;
2019 unsigned i;
2020 unsigned len;
2021 bool gen_stack_protect_signal = false;
2023 /* Compute the phase of the stack frame for this function. */
2025 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2026 int off = STARTING_FRAME_OFFSET % align;
2027 frame_phase = off ? align - off : 0;
2030 /* Set TREE_USED on all variables in the local_decls. */
2031 FOR_EACH_LOCAL_DECL (cfun, i, var)
2032 TREE_USED (var) = 1;
2033 /* Clear TREE_USED on all variables associated with a block scope. */
2034 clear_tree_used (DECL_INITIAL (current_function_decl));
2036 init_vars_expansion ();
2038 if (targetm.use_pseudo_pic_reg ())
2039 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2041 for (i = 0; i < SA.map->num_partitions; i++)
2043 tree var = partition_to_var (SA.map, i);
2045 gcc_assert (!virtual_operand_p (var));
2047 expand_one_ssa_partition (var);
2050 for (i = 1; i < num_ssa_names; i++)
2051 adjust_one_expanded_partition_var (ssa_name (i));
2053 if (flag_stack_protect == SPCT_FLAG_STRONG)
2054 gen_stack_protect_signal
2055 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2057 /* At this point all variables on the local_decls with TREE_USED
2058 set are not associated with any block scope. Lay them out. */
2060 len = vec_safe_length (cfun->local_decls);
2061 FOR_EACH_LOCAL_DECL (cfun, i, var)
2063 bool expand_now = false;
2065 /* Expanded above already. */
2066 if (is_gimple_reg (var))
2068 TREE_USED (var) = 0;
2069 goto next;
2071 /* We didn't set a block for static or extern because it's hard
2072 to tell the difference between a global variable (re)declared
2073 in a local scope, and one that's really declared there to
2074 begin with. And it doesn't really matter much, since we're
2075 not giving them stack space. Expand them now. */
2076 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2077 expand_now = true;
2079 /* Expand variables not associated with any block now. Those created by
2080 the optimizers could be live anywhere in the function. Those that
2081 could possibly have been scoped originally and detached from their
2082 block will have their allocation deferred so we coalesce them with
2083 others when optimization is enabled. */
2084 else if (TREE_USED (var))
2085 expand_now = true;
2087 /* Finally, mark all variables on the list as used. We'll use
2088 this in a moment when we expand those associated with scopes. */
2089 TREE_USED (var) = 1;
2091 if (expand_now)
2092 expand_one_var (var, true, true);
2094 next:
2095 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2097 rtx rtl = DECL_RTL_IF_SET (var);
2099 /* Keep artificial non-ignored vars in cfun->local_decls
2100 chain until instantiate_decls. */
2101 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2102 add_local_decl (cfun, var);
2103 else if (rtl == NULL_RTX)
2104 /* If rtl isn't set yet, which can happen e.g. with
2105 -fstack-protector, retry before returning from this
2106 function. */
2107 maybe_local_decls.safe_push (var);
2111 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2113 +-----------------+-----------------+
2114 | ...processed... | ...duplicates...|
2115 +-----------------+-----------------+
2117 +-- LEN points here.
2119 We just want the duplicates, as those are the artificial
2120 non-ignored vars that we want to keep until instantiate_decls.
2121 Move them down and truncate the array. */
2122 if (!vec_safe_is_empty (cfun->local_decls))
2123 cfun->local_decls->block_remove (0, len);
2125 /* At this point, all variables within the block tree with TREE_USED
2126 set are actually used by the optimized function. Lay them out. */
2127 expand_used_vars_for_block (outer_block, true);
2129 if (stack_vars_num > 0)
2131 add_scope_conflicts ();
2133 /* If stack protection is enabled, we don't share space between
2134 vulnerable data and non-vulnerable data. */
2135 if (flag_stack_protect != 0
2136 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2137 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2138 && lookup_attribute ("stack_protect",
2139 DECL_ATTRIBUTES (current_function_decl)))))
2140 add_stack_protection_conflicts ();
2142 /* Now that we have collected all stack variables, and have computed a
2143 minimal interference graph, attempt to save some stack space. */
2144 partition_stack_vars ();
2145 if (dump_file)
2146 dump_stack_var_partition ();
2149 switch (flag_stack_protect)
2151 case SPCT_FLAG_ALL:
2152 create_stack_guard ();
2153 break;
2155 case SPCT_FLAG_STRONG:
2156 if (gen_stack_protect_signal
2157 || cfun->calls_alloca || has_protected_decls
2158 || lookup_attribute ("stack_protect",
2159 DECL_ATTRIBUTES (current_function_decl)))
2160 create_stack_guard ();
2161 break;
2163 case SPCT_FLAG_DEFAULT:
2164 if (cfun->calls_alloca || has_protected_decls
2165 || lookup_attribute ("stack_protect",
2166 DECL_ATTRIBUTES (current_function_decl)))
2167 create_stack_guard ();
2168 break;
2170 case SPCT_FLAG_EXPLICIT:
2171 if (lookup_attribute ("stack_protect",
2172 DECL_ATTRIBUTES (current_function_decl)))
2173 create_stack_guard ();
2174 break;
2175 default:
2179 /* Assign rtl to each variable based on these partitions. */
2180 if (stack_vars_num > 0)
2182 struct stack_vars_data data;
2184 data.asan_vec = vNULL;
2185 data.asan_decl_vec = vNULL;
2186 data.asan_base = NULL_RTX;
2187 data.asan_alignb = 0;
2189 /* Reorder decls to be protected by iterating over the variables
2190 array multiple times, and allocating out of each phase in turn. */
2191 /* ??? We could probably integrate this into the qsort we did
2192 earlier, such that we naturally see these variables first,
2193 and thus naturally allocate things in the right order. */
2194 if (has_protected_decls)
2196 /* Phase 1 contains only character arrays. */
2197 expand_stack_vars (stack_protect_decl_phase_1, &data);
2199 /* Phase 2 contains other kinds of arrays. */
2200 if (flag_stack_protect == SPCT_FLAG_ALL
2201 || flag_stack_protect == SPCT_FLAG_STRONG
2202 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2203 && lookup_attribute ("stack_protect",
2204 DECL_ATTRIBUTES (current_function_decl))))
2205 expand_stack_vars (stack_protect_decl_phase_2, &data);
2208 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK)
2209 /* Phase 3, any partitions that need asan protection
2210 in addition to phase 1 and 2. */
2211 expand_stack_vars (asan_decl_phase_3, &data);
2213 if (!data.asan_vec.is_empty ())
2215 HOST_WIDE_INT prev_offset = frame_offset;
2216 HOST_WIDE_INT offset, sz, redzonesz;
2217 redzonesz = ASAN_RED_ZONE_SIZE;
2218 sz = data.asan_vec[0] - prev_offset;
2219 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2220 && data.asan_alignb <= 4096
2221 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2222 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2223 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2224 offset
2225 = alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE);
2226 data.asan_vec.safe_push (prev_offset);
2227 data.asan_vec.safe_push (offset);
2228 /* Leave space for alignment if STRICT_ALIGNMENT. */
2229 if (STRICT_ALIGNMENT)
2230 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2231 << ASAN_SHADOW_SHIFT)
2232 / BITS_PER_UNIT, 1);
2234 var_end_seq
2235 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2236 data.asan_base,
2237 data.asan_alignb,
2238 data.asan_vec.address (),
2239 data.asan_decl_vec.address (),
2240 data.asan_vec.length ());
2243 expand_stack_vars (NULL, &data);
2245 data.asan_vec.release ();
2246 data.asan_decl_vec.release ();
2249 fini_vars_expansion ();
2251 /* If there were any artificial non-ignored vars without rtl
2252 found earlier, see if deferred stack allocation hasn't assigned
2253 rtl to them. */
2254 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2256 rtx rtl = DECL_RTL_IF_SET (var);
2258 /* Keep artificial non-ignored vars in cfun->local_decls
2259 chain until instantiate_decls. */
2260 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2261 add_local_decl (cfun, var);
2263 maybe_local_decls.release ();
2265 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2266 if (STACK_ALIGNMENT_NEEDED)
2268 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2269 if (!FRAME_GROWS_DOWNWARD)
2270 frame_offset += align - 1;
2271 frame_offset &= -align;
2274 return var_end_seq;
2278 /* If we need to produce a detailed dump, print the tree representation
2279 for STMT to the dump file. SINCE is the last RTX after which the RTL
2280 generated for STMT should have been appended. */
2282 static void
2283 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2285 if (dump_file && (dump_flags & TDF_DETAILS))
2287 fprintf (dump_file, "\n;; ");
2288 print_gimple_stmt (dump_file, stmt, 0,
2289 TDF_SLIM | (dump_flags & TDF_LINENO));
2290 fprintf (dump_file, "\n");
2292 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2296 /* Maps the blocks that do not contain tree labels to rtx labels. */
2298 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2300 /* Returns the label_rtx expression for a label starting basic block BB. */
2302 static rtx_code_label *
2303 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2305 gimple_stmt_iterator gsi;
2306 tree lab;
2308 if (bb->flags & BB_RTL)
2309 return block_label (bb);
2311 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2312 if (elt)
2313 return *elt;
2315 /* Find the tree label if it is present. */
2317 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2319 glabel *lab_stmt;
2321 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2322 if (!lab_stmt)
2323 break;
2325 lab = gimple_label_label (lab_stmt);
2326 if (DECL_NONLOCAL (lab))
2327 break;
2329 return jump_target_rtx (lab);
2332 rtx_code_label *l = gen_label_rtx ();
2333 lab_rtx_for_bb->put (bb, l);
2334 return l;
2338 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2339 of a basic block where we just expanded the conditional at the end,
2340 possibly clean up the CFG and instruction sequence. LAST is the
2341 last instruction before the just emitted jump sequence. */
2343 static void
2344 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2346 /* Special case: when jumpif decides that the condition is
2347 trivial it emits an unconditional jump (and the necessary
2348 barrier). But we still have two edges, the fallthru one is
2349 wrong. purge_dead_edges would clean this up later. Unfortunately
2350 we have to insert insns (and split edges) before
2351 find_many_sub_basic_blocks and hence before purge_dead_edges.
2352 But splitting edges might create new blocks which depend on the
2353 fact that if there are two edges there's no barrier. So the
2354 barrier would get lost and verify_flow_info would ICE. Instead
2355 of auditing all edge splitters to care for the barrier (which
2356 normally isn't there in a cleaned CFG), fix it here. */
2357 if (BARRIER_P (get_last_insn ()))
2359 rtx_insn *insn;
2360 remove_edge (e);
2361 /* Now, we have a single successor block, if we have insns to
2362 insert on the remaining edge we potentially will insert
2363 it at the end of this block (if the dest block isn't feasible)
2364 in order to avoid splitting the edge. This insertion will take
2365 place in front of the last jump. But we might have emitted
2366 multiple jumps (conditional and one unconditional) to the
2367 same destination. Inserting in front of the last one then
2368 is a problem. See PR 40021. We fix this by deleting all
2369 jumps except the last unconditional one. */
2370 insn = PREV_INSN (get_last_insn ());
2371 /* Make sure we have an unconditional jump. Otherwise we're
2372 confused. */
2373 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2374 for (insn = PREV_INSN (insn); insn != last;)
2376 insn = PREV_INSN (insn);
2377 if (JUMP_P (NEXT_INSN (insn)))
2379 if (!any_condjump_p (NEXT_INSN (insn)))
2381 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2382 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2384 delete_insn (NEXT_INSN (insn));
2390 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2391 Returns a new basic block if we've terminated the current basic
2392 block and created a new one. */
2394 static basic_block
2395 expand_gimple_cond (basic_block bb, gcond *stmt)
2397 basic_block new_bb, dest;
2398 edge new_edge;
2399 edge true_edge;
2400 edge false_edge;
2401 rtx_insn *last2, *last;
2402 enum tree_code code;
2403 tree op0, op1;
2405 code = gimple_cond_code (stmt);
2406 op0 = gimple_cond_lhs (stmt);
2407 op1 = gimple_cond_rhs (stmt);
2408 /* We're sometimes presented with such code:
2409 D.123_1 = x < y;
2410 if (D.123_1 != 0)
2412 This would expand to two comparisons which then later might
2413 be cleaned up by combine. But some pattern matchers like if-conversion
2414 work better when there's only one compare, so make up for this
2415 here as special exception if TER would have made the same change. */
2416 if (SA.values
2417 && TREE_CODE (op0) == SSA_NAME
2418 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2419 && TREE_CODE (op1) == INTEGER_CST
2420 && ((gimple_cond_code (stmt) == NE_EXPR
2421 && integer_zerop (op1))
2422 || (gimple_cond_code (stmt) == EQ_EXPR
2423 && integer_onep (op1)))
2424 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2426 gimple *second = SSA_NAME_DEF_STMT (op0);
2427 if (gimple_code (second) == GIMPLE_ASSIGN)
2429 enum tree_code code2 = gimple_assign_rhs_code (second);
2430 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2432 code = code2;
2433 op0 = gimple_assign_rhs1 (second);
2434 op1 = gimple_assign_rhs2 (second);
2436 /* If jumps are cheap and the target does not support conditional
2437 compare, turn some more codes into jumpy sequences. */
2438 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2439 && targetm.gen_ccmp_first == NULL)
2441 if ((code2 == BIT_AND_EXPR
2442 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2443 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2444 || code2 == TRUTH_AND_EXPR)
2446 code = TRUTH_ANDIF_EXPR;
2447 op0 = gimple_assign_rhs1 (second);
2448 op1 = gimple_assign_rhs2 (second);
2450 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2452 code = TRUTH_ORIF_EXPR;
2453 op0 = gimple_assign_rhs1 (second);
2454 op1 = gimple_assign_rhs2 (second);
2460 last2 = last = get_last_insn ();
2462 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2463 set_curr_insn_location (gimple_location (stmt));
2465 /* These flags have no purpose in RTL land. */
2466 true_edge->flags &= ~EDGE_TRUE_VALUE;
2467 false_edge->flags &= ~EDGE_FALSE_VALUE;
2469 /* We can either have a pure conditional jump with one fallthru edge or
2470 two-way jump that needs to be decomposed into two basic blocks. */
2471 if (false_edge->dest == bb->next_bb)
2473 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2474 true_edge->probability);
2475 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2476 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2477 set_curr_insn_location (true_edge->goto_locus);
2478 false_edge->flags |= EDGE_FALLTHRU;
2479 maybe_cleanup_end_of_block (false_edge, last);
2480 return NULL;
2482 if (true_edge->dest == bb->next_bb)
2484 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2485 false_edge->probability);
2486 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2487 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2488 set_curr_insn_location (false_edge->goto_locus);
2489 true_edge->flags |= EDGE_FALLTHRU;
2490 maybe_cleanup_end_of_block (true_edge, last);
2491 return NULL;
2494 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2495 true_edge->probability);
2496 last = get_last_insn ();
2497 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2498 set_curr_insn_location (false_edge->goto_locus);
2499 emit_jump (label_rtx_for_bb (false_edge->dest));
2501 BB_END (bb) = last;
2502 if (BARRIER_P (BB_END (bb)))
2503 BB_END (bb) = PREV_INSN (BB_END (bb));
2504 update_bb_for_insn (bb);
2506 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2507 dest = false_edge->dest;
2508 redirect_edge_succ (false_edge, new_bb);
2509 false_edge->flags |= EDGE_FALLTHRU;
2510 new_bb->count = false_edge->count;
2511 new_bb->frequency = EDGE_FREQUENCY (false_edge);
2512 add_bb_to_loop (new_bb, bb->loop_father);
2513 new_edge = make_edge (new_bb, dest, 0);
2514 new_edge->probability = REG_BR_PROB_BASE;
2515 new_edge->count = new_bb->count;
2516 if (BARRIER_P (BB_END (new_bb)))
2517 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2518 update_bb_for_insn (new_bb);
2520 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2522 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2524 set_curr_insn_location (true_edge->goto_locus);
2525 true_edge->goto_locus = curr_insn_location ();
2528 return new_bb;
2531 /* Mark all calls that can have a transaction restart. */
2533 static void
2534 mark_transaction_restart_calls (gimple *stmt)
2536 struct tm_restart_node dummy;
2537 tm_restart_node **slot;
2539 if (!cfun->gimple_df->tm_restart)
2540 return;
2542 dummy.stmt = stmt;
2543 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2544 if (slot)
2546 struct tm_restart_node *n = *slot;
2547 tree list = n->label_or_list;
2548 rtx_insn *insn;
2550 for (insn = next_real_insn (get_last_insn ());
2551 !CALL_P (insn);
2552 insn = next_real_insn (insn))
2553 continue;
2555 if (TREE_CODE (list) == LABEL_DECL)
2556 add_reg_note (insn, REG_TM, label_rtx (list));
2557 else
2558 for (; list ; list = TREE_CHAIN (list))
2559 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2563 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2564 statement STMT. */
2566 static void
2567 expand_call_stmt (gcall *stmt)
2569 tree exp, decl, lhs;
2570 bool builtin_p;
2571 size_t i;
2573 if (gimple_call_internal_p (stmt))
2575 expand_internal_call (stmt);
2576 return;
2579 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2581 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2582 decl = gimple_call_fndecl (stmt);
2583 builtin_p = decl && DECL_BUILT_IN (decl);
2585 /* If this is not a builtin function, the function type through which the
2586 call is made may be different from the type of the function. */
2587 if (!builtin_p)
2588 CALL_EXPR_FN (exp)
2589 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2590 CALL_EXPR_FN (exp));
2592 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2593 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2595 for (i = 0; i < gimple_call_num_args (stmt); i++)
2597 tree arg = gimple_call_arg (stmt, i);
2598 gimple *def;
2599 /* TER addresses into arguments of builtin functions so we have a
2600 chance to infer more correct alignment information. See PR39954. */
2601 if (builtin_p
2602 && TREE_CODE (arg) == SSA_NAME
2603 && (def = get_gimple_for_ssa_name (arg))
2604 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2605 arg = gimple_assign_rhs1 (def);
2606 CALL_EXPR_ARG (exp, i) = arg;
2609 if (gimple_has_side_effects (stmt))
2610 TREE_SIDE_EFFECTS (exp) = 1;
2612 if (gimple_call_nothrow_p (stmt))
2613 TREE_NOTHROW (exp) = 1;
2615 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2616 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2617 if (decl
2618 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
2619 && (DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA
2620 || DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA_WITH_ALIGN))
2621 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2622 else
2623 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2624 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2625 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2626 CALL_WITH_BOUNDS_P (exp) = gimple_call_with_bounds_p (stmt);
2628 /* Ensure RTL is created for debug args. */
2629 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2631 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2632 unsigned int ix;
2633 tree dtemp;
2635 if (debug_args)
2636 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2638 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2639 expand_debug_expr (dtemp);
2643 lhs = gimple_call_lhs (stmt);
2644 if (lhs)
2645 expand_assignment (lhs, exp, false);
2646 else
2647 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2649 mark_transaction_restart_calls (stmt);
2653 /* Generate RTL for an asm statement (explicit assembler code).
2654 STRING is a STRING_CST node containing the assembler code text,
2655 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2656 insn is volatile; don't optimize it. */
2658 static void
2659 expand_asm_loc (tree string, int vol, location_t locus)
2661 rtx body;
2663 if (TREE_CODE (string) == ADDR_EXPR)
2664 string = TREE_OPERAND (string, 0);
2666 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2667 ggc_strdup (TREE_STRING_POINTER (string)),
2668 locus);
2670 MEM_VOLATILE_P (body) = vol;
2672 emit_insn (body);
/* Count how many characters of the NUL-terminated string S compare
   equal to C.  */
static int
n_occurrences (int c, const char *s)
{
  int count = 0;
  for (const char *p = s; *p != '\0'; p++)
    if (*p == c)
      count++;
  return count;
}
2685 /* A subroutine of expand_asm_operands. Check that all operands have
2686 the same number of alternatives. Return true if so. */
2688 static bool
2689 check_operand_nalternatives (const vec<const char *> &constraints)
2691 unsigned len = constraints.length();
2692 if (len > 0)
2694 int nalternatives = n_occurrences (',', constraints[0]);
2696 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2698 error ("too many alternatives in %<asm%>");
2699 return false;
2702 for (unsigned i = 1; i < len; ++i)
2703 if (n_occurrences (',', constraints[i]) != nalternatives)
2705 error ("operand constraints for %<asm%> differ "
2706 "in number of alternatives");
2707 return false;
2710 return true;
2713 /* Check for overlap between registers marked in CLOBBERED_REGS and
2714 anything inappropriate in T. Emit error and return the register
2715 variable definition for error, NULL_TREE for ok. */
2717 static bool
2718 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2720 /* Conflicts between asm-declared register variables and the clobber
2721 list are not allowed. */
2722 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2724 if (overlap)
2726 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2727 DECL_NAME (overlap));
2729 /* Reset registerness to stop multiple errors emitted for a single
2730 variable. */
2731 DECL_REGISTER (overlap) = 0;
2732 return true;
2735 return false;
2738 /* Generate RTL for an asm statement with arguments.
2739 STRING is the instruction template.
2740 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2741 Each output or input has an expression in the TREE_VALUE and
2742 a tree list in TREE_PURPOSE which in turn contains a constraint
2743 name in TREE_VALUE (or NULL_TREE) and a constraint string
2744 in TREE_PURPOSE.
2745 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2746 that is clobbered by this insn.
2748 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2749 should be the fallthru basic block of the asm goto.
2751 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2752 Some elements of OUTPUTS may be replaced with trees representing temporary
2753 values. The caller should copy those temporary values to the originally
2754 specified lvalues.
2756 VOL nonzero means the insn is volatile; don't optimize it. */
2758 static void
2759 expand_asm_stmt (gasm *stmt)
2761 class save_input_location
2763 location_t old;
2765 public:
2766 explicit save_input_location(location_t where)
2768 old = input_location;
2769 input_location = where;
2772 ~save_input_location()
2774 input_location = old;
2778 location_t locus = gimple_location (stmt);
2780 if (gimple_asm_input_p (stmt))
2782 const char *s = gimple_asm_string (stmt);
2783 tree string = build_string (strlen (s), s);
2784 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2785 return;
2788 /* There are some legacy diagnostics in here, and also avoids a
2789 sixth parameger to targetm.md_asm_adjust. */
2790 save_input_location s_i_l(locus);
2792 unsigned noutputs = gimple_asm_noutputs (stmt);
2793 unsigned ninputs = gimple_asm_ninputs (stmt);
2794 unsigned nlabels = gimple_asm_nlabels (stmt);
2795 unsigned i;
2797 /* ??? Diagnose during gimplification? */
2798 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2800 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2801 return;
2804 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2805 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2806 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2808 /* Copy the gimple vectors into new vectors that we can manipulate. */
2810 output_tvec.safe_grow (noutputs);
2811 input_tvec.safe_grow (ninputs);
2812 constraints.safe_grow (noutputs + ninputs);
2814 for (i = 0; i < noutputs; ++i)
2816 tree t = gimple_asm_output_op (stmt, i);
2817 output_tvec[i] = TREE_VALUE (t);
2818 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2820 for (i = 0; i < ninputs; i++)
2822 tree t = gimple_asm_input_op (stmt, i);
2823 input_tvec[i] = TREE_VALUE (t);
2824 constraints[i + noutputs]
2825 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2828 /* ??? Diagnose during gimplification? */
2829 if (! check_operand_nalternatives (constraints))
2830 return;
2832 /* Count the number of meaningful clobbered registers, ignoring what
2833 we would ignore later. */
2834 auto_vec<rtx> clobber_rvec;
2835 HARD_REG_SET clobbered_regs;
2836 CLEAR_HARD_REG_SET (clobbered_regs);
2838 if (unsigned n = gimple_asm_nclobbers (stmt))
2840 clobber_rvec.reserve (n);
2841 for (i = 0; i < n; i++)
2843 tree t = gimple_asm_clobber_op (stmt, i);
2844 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2845 int nregs, j;
2847 j = decode_reg_name_and_count (regname, &nregs);
2848 if (j < 0)
2850 if (j == -2)
2852 /* ??? Diagnose during gimplification? */
2853 error ("unknown register name %qs in %<asm%>", regname);
2855 else if (j == -4)
2857 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2858 clobber_rvec.safe_push (x);
2860 else
2862 /* Otherwise we should have -1 == empty string
2863 or -3 == cc, which is not a register. */
2864 gcc_assert (j == -1 || j == -3);
2867 else
2868 for (int reg = j; reg < j + nregs; reg++)
2870 /* Clobbering the PIC register is an error. */
2871 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2873 /* ??? Diagnose during gimplification? */
2874 error ("PIC register clobbered by %qs in %<asm%>",
2875 regname);
2876 return;
2879 SET_HARD_REG_BIT (clobbered_regs, reg);
2880 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2881 clobber_rvec.safe_push (x);
2885 unsigned nclobbers = clobber_rvec.length();
2887 /* First pass over inputs and outputs checks validity and sets
2888 mark_addressable if needed. */
2889 /* ??? Diagnose during gimplification? */
2891 for (i = 0; i < noutputs; ++i)
2893 tree val = output_tvec[i];
2894 tree type = TREE_TYPE (val);
2895 const char *constraint;
2896 bool is_inout;
2897 bool allows_reg;
2898 bool allows_mem;
2900 /* Try to parse the output constraint. If that fails, there's
2901 no point in going further. */
2902 constraint = constraints[i];
2903 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
2904 &allows_mem, &allows_reg, &is_inout))
2905 return;
2907 if (! allows_reg
2908 && (allows_mem
2909 || is_inout
2910 || (DECL_P (val)
2911 && REG_P (DECL_RTL (val))
2912 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
2913 mark_addressable (val);
2916 for (i = 0; i < ninputs; ++i)
2918 bool allows_reg, allows_mem;
2919 const char *constraint;
2921 constraint = constraints[i + noutputs];
2922 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
2923 constraints.address (),
2924 &allows_mem, &allows_reg))
2925 return;
2927 if (! allows_reg && allows_mem)
2928 mark_addressable (input_tvec[i]);
2931 /* Second pass evaluates arguments. */
2933 /* Make sure stack is consistent for asm goto. */
2934 if (nlabels > 0)
2935 do_pending_stack_adjust ();
2936 int old_generating_concat_p = generating_concat_p;
2938 /* Vector of RTX's of evaluated output operands. */
2939 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
2940 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
2941 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
2943 output_rvec.safe_grow (noutputs);
2945 for (i = 0; i < noutputs; ++i)
2947 tree val = output_tvec[i];
2948 tree type = TREE_TYPE (val);
2949 bool is_inout, allows_reg, allows_mem, ok;
2950 rtx op;
2952 ok = parse_output_constraint (&constraints[i], i, ninputs,
2953 noutputs, &allows_mem, &allows_reg,
2954 &is_inout);
2955 gcc_assert (ok);
2957 /* If an output operand is not a decl or indirect ref and our constraint
2958 allows a register, make a temporary to act as an intermediate.
2959 Make the asm insn write into that, then we will copy it to
2960 the real output operand. Likewise for promoted variables. */
2962 generating_concat_p = 0;
2964 if ((TREE_CODE (val) == INDIRECT_REF
2965 && allows_mem)
2966 || (DECL_P (val)
2967 && (allows_mem || REG_P (DECL_RTL (val)))
2968 && ! (REG_P (DECL_RTL (val))
2969 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
2970 || ! allows_reg
2971 || is_inout)
2973 op = expand_expr (val, NULL_RTX, VOIDmode,
2974 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
2975 if (MEM_P (op))
2976 op = validize_mem (op);
2978 if (! allows_reg && !MEM_P (op))
2979 error ("output number %d not directly addressable", i);
2980 if ((! allows_mem && MEM_P (op))
2981 || GET_CODE (op) == CONCAT)
2983 rtx old_op = op;
2984 op = gen_reg_rtx (GET_MODE (op));
2986 generating_concat_p = old_generating_concat_p;
2988 if (is_inout)
2989 emit_move_insn (op, old_op);
2991 push_to_sequence2 (after_rtl_seq, after_rtl_end);
2992 emit_move_insn (old_op, op);
2993 after_rtl_seq = get_insns ();
2994 after_rtl_end = get_last_insn ();
2995 end_sequence ();
2998 else
3000 op = assign_temp (type, 0, 1);
3001 op = validize_mem (op);
3002 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3003 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3005 generating_concat_p = old_generating_concat_p;
3007 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3008 expand_assignment (val, make_tree (type, op), false);
3009 after_rtl_seq = get_insns ();
3010 after_rtl_end = get_last_insn ();
3011 end_sequence ();
3013 output_rvec[i] = op;
3015 if (is_inout)
3016 inout_opnum.safe_push (i);
3019 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3020 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3022 input_rvec.safe_grow (ninputs);
3023 input_mode.safe_grow (ninputs);
3025 generating_concat_p = 0;
3027 for (i = 0; i < ninputs; ++i)
3029 tree val = input_tvec[i];
3030 tree type = TREE_TYPE (val);
3031 bool allows_reg, allows_mem, ok;
3032 const char *constraint;
3033 rtx op;
3035 constraint = constraints[i + noutputs];
3036 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3037 constraints.address (),
3038 &allows_mem, &allows_reg);
3039 gcc_assert (ok);
3041 /* EXPAND_INITIALIZER will not generate code for valid initializer
3042 constants, but will still generate code for other types of operand.
3043 This is the behavior we want for constant constraints. */
3044 op = expand_expr (val, NULL_RTX, VOIDmode,
3045 allows_reg ? EXPAND_NORMAL
3046 : allows_mem ? EXPAND_MEMORY
3047 : EXPAND_INITIALIZER);
3049 /* Never pass a CONCAT to an ASM. */
3050 if (GET_CODE (op) == CONCAT)
3051 op = force_reg (GET_MODE (op), op);
3052 else if (MEM_P (op))
3053 op = validize_mem (op);
3055 if (asm_operand_ok (op, constraint, NULL) <= 0)
3057 if (allows_reg && TYPE_MODE (type) != BLKmode)
3058 op = force_reg (TYPE_MODE (type), op);
3059 else if (!allows_mem)
3060 warning (0, "asm operand %d probably doesn%'t match constraints",
3061 i + noutputs);
3062 else if (MEM_P (op))
3064 /* We won't recognize either volatile memory or memory
3065 with a queued address as available a memory_operand
3066 at this point. Ignore it: clearly this *is* a memory. */
3068 else
3069 gcc_unreachable ();
3071 input_rvec[i] = op;
3072 input_mode[i] = TYPE_MODE (type);
3075 /* For in-out operands, copy output rtx to input rtx. */
3076 unsigned ninout = inout_opnum.length();
3077 for (i = 0; i < ninout; i++)
3079 int j = inout_opnum[i];
3080 rtx o = output_rvec[j];
3082 input_rvec.safe_push (o);
3083 input_mode.safe_push (GET_MODE (o));
3085 char buffer[16];
3086 sprintf (buffer, "%d", j);
3087 constraints.safe_push (ggc_strdup (buffer));
3089 ninputs += ninout;
3091 /* Sometimes we wish to automatically clobber registers across an asm.
3092 Case in point is when the i386 backend moved from cc0 to a hard reg --
3093 maintaining source-level compatibility means automatically clobbering
3094 the flags register. */
3095 rtx_insn *after_md_seq = NULL;
3096 if (targetm.md_asm_adjust)
3097 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3098 constraints, clobber_rvec,
3099 clobbered_regs);
3101 /* Do not allow the hook to change the output and input count,
3102 lest it mess up the operand numbering. */
3103 gcc_assert (output_rvec.length() == noutputs);
3104 gcc_assert (input_rvec.length() == ninputs);
3105 gcc_assert (constraints.length() == noutputs + ninputs);
3107 /* But it certainly can adjust the clobbers. */
3108 nclobbers = clobber_rvec.length();
3110 /* Third pass checks for easy conflicts. */
3111 /* ??? Why are we doing this on trees instead of rtx. */
3113 bool clobber_conflict_found = 0;
3114 for (i = 0; i < noutputs; ++i)
3115 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3116 clobber_conflict_found = 1;
3117 for (i = 0; i < ninputs - ninout; ++i)
3118 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3119 clobber_conflict_found = 1;
3121 /* Make vectors for the expression-rtx, constraint strings,
3122 and named operands. */
3124 rtvec argvec = rtvec_alloc (ninputs);
3125 rtvec constraintvec = rtvec_alloc (ninputs);
3126 rtvec labelvec = rtvec_alloc (nlabels);
3128 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3129 : GET_MODE (output_rvec[0])),
3130 ggc_strdup (gimple_asm_string (stmt)),
3131 empty_string, 0, argvec, constraintvec,
3132 labelvec, locus);
3133 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3135 for (i = 0; i < ninputs; ++i)
3137 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3138 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3139 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3140 constraints[i + noutputs],
3141 locus);
3144 /* Copy labels to the vector. */
3145 rtx_code_label *fallthru_label = NULL;
3146 if (nlabels > 0)
3148 basic_block fallthru_bb = NULL;
3149 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3150 if (fallthru)
3151 fallthru_bb = fallthru->dest;
3153 for (i = 0; i < nlabels; ++i)
3155 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3156 rtx_insn *r;
3157 /* If asm goto has any labels in the fallthru basic block, use
3158 a label that we emit immediately after the asm goto. Expansion
3159 may insert further instructions into the same basic block after
3160 asm goto and if we don't do this, insertion of instructions on
3161 the fallthru edge might misbehave. See PR58670. */
3162 if (fallthru_bb && label_to_block_fn (cfun, label) == fallthru_bb)
3164 if (fallthru_label == NULL_RTX)
3165 fallthru_label = gen_label_rtx ();
3166 r = fallthru_label;
3168 else
3169 r = label_rtx (label);
3170 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3174 /* Now, for each output, construct an rtx
3175 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3176 ARGVEC CONSTRAINTS OPNAMES))
3177 If there is more than one, put them inside a PARALLEL. */
3179 if (nlabels > 0 && nclobbers == 0)
3181 gcc_assert (noutputs == 0);
3182 emit_jump_insn (body);
3184 else if (noutputs == 0 && nclobbers == 0)
3186 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3187 emit_insn (body);
3189 else if (noutputs == 1 && nclobbers == 0)
3191 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3192 emit_insn (gen_rtx_SET (output_rvec[0], body));
3194 else
3196 rtx obody = body;
3197 int num = noutputs;
3199 if (num == 0)
3200 num = 1;
3202 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3204 /* For each output operand, store a SET. */
3205 for (i = 0; i < noutputs; ++i)
3207 rtx src, o = output_rvec[i];
3208 if (i == 0)
3210 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3211 src = obody;
3213 else
3215 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3216 ASM_OPERANDS_TEMPLATE (obody),
3217 constraints[i], i, argvec,
3218 constraintvec, labelvec, locus);
3219 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3221 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3224 /* If there are no outputs (but there are some clobbers)
3225 store the bare ASM_OPERANDS into the PARALLEL. */
3226 if (i == 0)
3227 XVECEXP (body, 0, i++) = obody;
3229 /* Store (clobber REG) for each clobbered register specified. */
3230 for (unsigned j = 0; j < nclobbers; ++j)
3232 rtx clobbered_reg = clobber_rvec[j];
3234 /* Do sanity check for overlap between clobbers and respectively
3235 input and outputs that hasn't been handled. Such overlap
3236 should have been detected and reported above. */
3237 if (!clobber_conflict_found && REG_P (clobbered_reg))
3239 /* We test the old body (obody) contents to avoid
3240 tripping over the under-construction body. */
3241 for (unsigned k = 0; k < noutputs; ++k)
3242 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3243 internal_error ("asm clobber conflict with output operand");
3245 for (unsigned k = 0; k < ninputs - ninout; ++k)
3246 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3247 internal_error ("asm clobber conflict with input operand");
3250 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3253 if (nlabels > 0)
3254 emit_jump_insn (body);
3255 else
3256 emit_insn (body);
3259 generating_concat_p = old_generating_concat_p;
3261 if (fallthru_label)
3262 emit_label (fallthru_label);
3264 if (after_md_seq)
3265 emit_insn (after_md_seq);
3266 if (after_rtl_seq)
3267 emit_insn (after_rtl_seq);
3269 free_temp_slots ();
3270 crtl->has_asm_statement = 1;
3273 /* Emit code to jump to the address
3274 specified by the pointer expression EXP. */
3276 static void
3277 expand_computed_goto (tree exp)
3279 rtx x = expand_normal (exp);
3281 do_pending_stack_adjust ();
3282 emit_indirect_jump (x);
3285 /* Generate RTL code for a `goto' statement with target label LABEL.
3286 LABEL should be a LABEL_DECL tree node that was or will later be
3287 defined with `expand_label'. */
3289 static void
3290 expand_goto (tree label)
3292 #ifdef ENABLE_CHECKING
3293 /* Check for a nonlocal goto to a containing function. Should have
3294 gotten translated to __builtin_nonlocal_goto. */
3295 tree context = decl_function_context (label);
3296 gcc_assert (!context || context == current_function_decl);
3297 #endif
3299 emit_jump (jump_target_rtx (label));
3302 /* Output a return with no value. */
3304 static void
3305 expand_null_return_1 (void)
3307 clear_pending_stack_adjust ();
3308 do_pending_stack_adjust ();
3309 emit_jump (return_label);
3312 /* Generate RTL to return from the current function, with no value.
3313 (That is, we do not do anything about returning any value.) */
3315 void
3316 expand_null_return (void)
3318 /* If this function was declared to return a value, but we
3319 didn't, clobber the return registers so that they are not
3320 propagated live to the rest of the function. */
3321 clobber_return_register ();
3323 expand_null_return_1 ();
3326 /* Generate RTL to return from the current function, with value VAL. */
3328 static void
3329 expand_value_return (rtx val)
3331 /* Copy the value to the return location unless it's already there. */
3333 tree decl = DECL_RESULT (current_function_decl);
3334 rtx return_reg = DECL_RTL (decl);
3335 if (return_reg != val)
3337 tree funtype = TREE_TYPE (current_function_decl);
3338 tree type = TREE_TYPE (decl);
3339 int unsignedp = TYPE_UNSIGNED (type);
3340 machine_mode old_mode = DECL_MODE (decl);
3341 machine_mode mode;
3342 if (DECL_BY_REFERENCE (decl))
3343 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3344 else
3345 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3347 if (mode != old_mode)
3348 val = convert_modes (mode, old_mode, val, unsignedp);
3350 if (GET_CODE (return_reg) == PARALLEL)
3351 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3352 else
3353 emit_move_insn (return_reg, val);
3356 expand_null_return_1 ();
3359 /* Generate RTL to evaluate the expression RETVAL and return it
3360 from the current function. */
/* RETVAL is the tree being returned.  When it is a MODIFY_EXPR or
   INIT_EXPR whose destination is a RESULT_DECL, only its right-hand
   side (RETVAL_RHS below) is treated as the value.  BOUNDS is the tree
   for the returned bounds; it is consulted only when the function's
   DECL_RESULT has a DECL_BOUNDS_RTL.  In that case a BOUNDS that is
   non-null and not error_mark_node is expanded and stored through the
   store_returned_bounds target hook; error_mark_node selects zero
   bounds; a null BOUNDS makes the bounds be loaded from the address of
   RETVAL_RHS.  */
3362 static void
3363 expand_return (tree retval, tree bounds)
3365 rtx result_rtl;
3366 rtx val = 0;
3367 tree retval_rhs;
3368 rtx bounds_rtl;
3370 /* If function wants no value, give it none. */
3371 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
/* RETVAL is still expanded here, but its result is discarded.  */
3373 expand_normal (retval);
3374 expand_null_return ();
3375 return;
3378 if (retval == error_mark_node)
3380 /* Treat this like a return of no value from a function that
3381 returns a value. */
3382 expand_null_return ();
3383 return;
/* Strip an assignment to the RESULT_DECL so that RETVAL_RHS names the
   value actually being returned.  */
3385 else if ((TREE_CODE (retval) == MODIFY_EXPR
3386 || TREE_CODE (retval) == INIT_EXPR)
3387 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3388 retval_rhs = TREE_OPERAND (retval, 1);
3389 else
3390 retval_rhs = retval;
3392 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3394 /* Put returned bounds to the right place. */
3395 bounds_rtl = DECL_BOUNDS_RTL (DECL_RESULT (current_function_decl));
3396 if (bounds_rtl)
3398 rtx addr = NULL;
3399 rtx bnd = NULL;
/* Case 1: usable bounds were passed in; expand and store them.  */
3401 if (bounds && bounds != error_mark_node)
3403 bnd = expand_normal (bounds);
3404 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Case 2: BOUNDS is null or error_mark_node and the bounds location is
   a single register.  A non-null BOUNDS here can only be
   error_mark_node, which selects zero bounds.  */
3406 else if (REG_P (bounds_rtl))
3408 if (bounds)
3409 bnd = chkp_expand_zero_bounds ();
3410 else
3412 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3413 addr = gen_rtx_MEM (Pmode, addr);
3414 bnd = targetm.calls.load_bounds_for_arg (addr, NULL, NULL);
3417 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Case 3: the bounds location is asserted to be a PARALLEL; each of its
   elements is filled in turn.  */
3419 else
3421 int n;
3423 gcc_assert (GET_CODE (bounds_rtl) == PARALLEL);
3425 if (bounds)
3426 bnd = chkp_expand_zero_bounds ();
3427 else
3429 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3430 addr = gen_rtx_MEM (Pmode, addr);
/* For each PARALLEL element, operand 0 is the slot to store into and
   operand 1 is used as a constant offset from ADDR when the bounds must
   be loaded rather than zeroed.  */
3433 for (n = 0; n < XVECLEN (bounds_rtl, 0); n++)
3435 rtx slot = XEXP (XVECEXP (bounds_rtl, 0, n), 0);
3436 if (!bounds)
3438 rtx offs = XEXP (XVECEXP (bounds_rtl, 0, n), 1);
3439 rtx from = adjust_address (addr, Pmode, INTVAL (offs));
3440 bnd = targetm.calls.load_bounds_for_arg (from, NULL, NULL);
3442 targetm.calls.store_returned_bounds (slot, bnd);
/* No bounds location.  In an instrumented function, a value whose type
   has pointers, that is not BOUNDED_P and is not the RESULT_DECL
   itself, has its bounds copied to RESULT_RTL, which is asserted to be
   a MEM.  */
3446 else if (chkp_function_instrumented_p (current_function_decl)
3447 && !BOUNDED_P (retval_rhs)
3448 && chkp_type_has_pointer (TREE_TYPE (retval_rhs))
3449 && TREE_CODE (retval_rhs) != RESULT_DECL)
3451 rtx addr = expand_normal (build_fold_addr_expr (retval_rhs));
3452 addr = gen_rtx_MEM (Pmode, addr);
3454 gcc_assert (MEM_P (result_rtl));
3456 chkp_copy_bounds_for_stack_parm (result_rtl, addr, TREE_TYPE (retval_rhs));
3459 /* If we are returning the RESULT_DECL, then the value has already
3460 been stored into it, so we don't have to do anything special. */
3461 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3462 expand_value_return (result_rtl);
3464 /* If the result is an aggregate that is being returned in one (or more)
3465 registers, load the registers here. */
3467 else if (retval_rhs != 0
3468 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3469 && REG_P (result_rtl))
3471 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
/* A null VAL from copy_blkmode_to_reg is handled as a return with no
   value.  */
3472 if (val)
3474 /* Use the mode of the result value on the return register. */
3475 PUT_MODE (result_rtl, GET_MODE (val));
3476 expand_value_return (val);
3478 else
3479 expand_null_return ();
3481 else if (retval_rhs != 0
3482 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3483 && (REG_P (result_rtl)
3484 || (GET_CODE (result_rtl) == PARALLEL)))
3486 /* Compute the return value into a temporary (usually a pseudo reg). */
/* NOTE(review): the line holding the assignment target (source line
   3487) is absent from this extract; the following lines use VAL as the
   temporary, so the target is presumably VAL -- confirm against the
   upstream file.  */
3488 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3489 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3490 val = force_not_mem (val);
3491 expand_value_return (val);
3493 else
3495 /* No hard reg used; calculate value into hard return reg. */
/* The whole RETVAL (including any assignment to the RESULT_DECL) is
   expanded for its side effects, with const0_rtx as the target.  */
3496 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3497 expand_value_return (result_rtl);
3501 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3502 STMT that doesn't require special handling for outgoing edges. That
3503 is no tailcalls and no GIMPLE_COND. */
/* The current insn location is first set from STMT, then the expansion
   is dispatched on gimple_code (STMT).  Any statement code that is not
   listed in the switch reaches gcc_unreachable.  */
3505 static void
3506 expand_gimple_stmt_1 (gimple *stmt)
3508 tree op0;
3510 set_curr_insn_location (gimple_location (stmt));
3512 switch (gimple_code (stmt))
3514 case GIMPLE_GOTO:
/* A LABEL_DECL destination is a plain goto; any other destination is
   handled as a computed goto.  */
3515 op0 = gimple_goto_dest (stmt);
3516 if (TREE_CODE (op0) == LABEL_DECL)
3517 expand_goto (op0);
3518 else
3519 expand_computed_goto (op0);
3520 break;
3521 case GIMPLE_LABEL:
3522 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3523 break;
/* GIMPLE_NOP and GIMPLE_PREDICT generate no RTL.  */
3524 case GIMPLE_NOP:
3525 case GIMPLE_PREDICT:
3526 break;
3527 case GIMPLE_SWITCH:
3528 expand_case (as_a <gswitch *> (stmt));
3529 break;
3530 case GIMPLE_ASM:
3531 expand_asm_stmt (as_a <gasm *> (stmt));
3532 break;
3533 case GIMPLE_CALL:
3534 expand_call_stmt (as_a <gcall *> (stmt));
3535 break;
3537 case GIMPLE_RETURN:
/* BND holds the returned bounds and OP0 the returned value; either may
   be null.  */
3539 tree bnd = gimple_return_retbnd (as_a <greturn *> (stmt));
3540 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3542 if (op0 && op0 != error_mark_node)
3544 tree result = DECL_RESULT (current_function_decl);
3546 /* If we are not returning the current function's RESULT_DECL,
3547 build an assignment to it. */
3548 if (op0 != result)
3550 /* I believe that a function's RESULT_DECL is unique. */
3551 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3553 /* ??? We'd like to use simply expand_assignment here,
3554 but this fails if the value is of BLKmode but the return
3555 decl is a register. expand_return has special handling
3556 for this combination, which eventually should move
3557 to common code. See comments there. Until then, let's
3558 build a modify expression :-/ */
3559 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3560 result, op0);
3562 /* Mark we have return statement with missing bounds. */
3563 if (!bnd && chkp_function_instrumented_p (cfun->decl))
3564 bnd = error_mark_node;
/* A return without a value becomes a null return; otherwise the value
   (possibly wrapped in the MODIFY_EXPR built above) and the bounds are
   handed to expand_return.  */
3567 if (!op0)
3568 expand_null_return ();
3569 else
3570 expand_return (op0, bnd);
3572 break;
3574 case GIMPLE_ASSIGN:
3576 gassign *assign_stmt = as_a <gassign *> (stmt);
3577 tree lhs = gimple_assign_lhs (assign_stmt);
3579 /* Tree expand used to fiddle with |= and &= of two bitfield
3580 COMPONENT_REFs here. This can't happen with gimple, the LHS
3581 of binary assigns must be a gimple reg. */
/* First arm: the destination is not an SSA_NAME, or the right-hand side
   is a single operand.  The assert just below requires a single-operand
   right-hand side in both cases.  */
3583 if (TREE_CODE (lhs) != SSA_NAME
3584 || get_gimple_rhs_class (gimple_expr_code (stmt))
3585 == GIMPLE_SINGLE_RHS)
3587 tree rhs = gimple_assign_rhs1 (assign_stmt);
3588 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3589 == GIMPLE_SINGLE_RHS);
3590 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3591 /* Do not put locations on possibly shared trees. */
3592 && !is_gimple_min_invariant (rhs))
3593 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
/* NOTE(review): the statement controlled by this `if' (source line
   3597) is absent from this extract; presumably it is an empty
   statement, so that clobbers emit nothing -- confirm against the
   upstream file.  */
3594 if (TREE_CLOBBER_P (rhs))
3595 /* This is a clobber to mark the going out of scope for
3596 this LHS. */
3598 else
3599 expand_assignment (lhs, rhs,
3600 gimple_assign_nontemporal_move_p (
3601 assign_stmt));
/* Second arm: an SSA_NAME destination with a unary, binary or ternary
   right-hand side.  The operands are gathered into OPS and expanded
   with expand_expr_real_2.  */
3603 else
3605 rtx target, temp;
3606 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3607 struct separate_ops ops;
3608 bool promoted = false;
3610 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3611 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3612 promoted = true;
3614 ops.code = gimple_assign_rhs_code (assign_stmt);
3615 ops.type = TREE_TYPE (lhs);
/* The cases fall through on purpose: a ternary right-hand side fills
   op2, op1 and op0, a binary one op1 and op0, a unary one only op0.  */
3616 switch (get_gimple_rhs_class (ops.code))
3618 case GIMPLE_TERNARY_RHS:
3619 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3620 /* Fallthru */
3621 case GIMPLE_BINARY_RHS:
3622 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3623 /* Fallthru */
3624 case GIMPLE_UNARY_RHS:
3625 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3626 break;
3627 default:
3628 gcc_unreachable ();
3630 ops.location = gimple_location (stmt);
3632 /* If we want to use a nontemporal store, force the value to
3633 register first. If we store into a promoted register,
3634 don't directly expand to target. */
3635 temp = nontemporal || promoted ? NULL_RTX : target;
3636 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3637 EXPAND_NORMAL);
/* NOTE(review): the statements controlled by `if (temp == target)' and
   by the `nontemporal' branch further down (source lines 3640 and 3658)
   are absent from this extract; presumably both are empty statements,
   meaning nothing more needs to be emitted -- confirm against the
   upstream file.  */
3639 if (temp == target)
3641 else if (promoted)
3643 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3644 /* If TEMP is a VOIDmode constant, use convert_modes to make
3645 sure that we properly convert it. */
3646 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3648 temp = convert_modes (GET_MODE (target),
3649 TYPE_MODE (ops.type),
3650 temp, unsignedp);
3651 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3652 GET_MODE (target), temp, unsignedp);
/* The store goes to the register inside the promoted SUBREG.  */
3655 convert_move (SUBREG_REG (target), temp, unsignedp);
3657 else if (nontemporal && emit_storent_insn (target, temp))
3659 else
/* Ordinary case: force TEMP into an operand (preferably TARGET) and
   copy it to TARGET if it ended up elsewhere.  */
3661 temp = force_operand (temp, target);
3662 if (temp != target)
3663 emit_move_insn (target, temp);
3667 break;
3669 default:
3670 gcc_unreachable ();
3674 /* Expand one gimple statement STMT and return the last RTL instruction
3675 before any of the newly generated ones.
3677 In addition to generating the necessary RTL instructions this also
3678 sets REG_EH_REGION notes if necessary and sets the current source
3679 location for diagnostics. */
3681 static rtx_insn *
3682 expand_gimple_stmt (gimple *stmt)
3684 location_t saved_location = input_location;
3685 rtx_insn *last = get_last_insn ();
3686 int lp_nr;
3688 gcc_assert (cfun);
3690 /* We need to save and restore the current source location so that errors
3691 discovered during expansion are emitted with the right location. But
3692 it would be better if the diagnostic routines used the source location
3693 embedded in the tree nodes rather than globals. */
3694 if (gimple_has_location (stmt))
3695 input_location = gimple_location (stmt);
3697 expand_gimple_stmt_1 (stmt);
3699 /* Free any temporaries used to evaluate this statement. */
3700 free_temp_slots ();
3702 input_location = saved_location;
3704 /* Mark all insns that may trap. */
3705 lp_nr = lookup_stmt_eh_lp (stmt);
3706 if (lp_nr)
3708 rtx_insn *insn;
3709 for (insn = next_real_insn (last); insn;
3710 insn = next_real_insn (insn))
3712 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3713 /* If we want exceptions for non-call insns, any
3714 may_trap_p instruction may throw. */
3715 && GET_CODE (PATTERN (insn)) != CLOBBER
3716 && GET_CODE (PATTERN (insn)) != USE
3717 && insn_could_throw_p (insn))
3718 make_reg_eh_region_note (insn, 0, lp_nr);
3722 return last;
3725 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3726 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3727 generated a tail call (something that might be denied by the ABI
3728 rules governing the call; see calls.c).
3730 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3731 can still reach the rest of BB. The case here is __builtin_sqrt,
3732 where the NaN result goes through the external function (with a
3733 tailcall) and the normal result happens via a sqrt instruction. */
/* BB is the block being expanded and STMT the call.  When no sibling
   call insn was emitted, *CAN_FALLTHRU is set to true and NULL is
   returned.  Otherwise the returned block is BB itself, or a new block
   created for the insns that follow the sibcall's barrier when any
   remain.  */
3735 static basic_block
3736 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3738 rtx_insn *last2, *last;
3739 edge e;
3740 edge_iterator ei;
3741 int probability;
3742 gcov_type count;
/* LAST2 remembers the insn preceding the expansion, for the dump
   calls below.  */
3744 last2 = last = expand_gimple_stmt (stmt);
/* Scan the insns just emitted for a sibling call.  */
3746 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3747 if (CALL_P (last) && SIBLING_CALL_P (last))
3748 goto found;
/* No sibling call was generated.  */
3750 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3752 *can_fallthru = true;
3753 return NULL;
3755 found:
3756 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3757 Any instructions emitted here are about to be deleted. */
3758 do_pending_stack_adjust ();
3760 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3761 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3762 EH or abnormal edges, we shouldn't have created a tail call in
3763 the first place. So it seems to me we should just be removing
3764 all edges here, or redirecting the existing fallthru edge to
3765 the exit block. */
/* PROBABILITY and COUNT accumulate the totals of the removed edges so
   that they can be added to the sibcall edge created further down.  */
3767 probability = 0;
3768 count = 0;
/* The iterator is advanced only when the current edge is kept; after
   remove_edge the same iterator is re-read without advancing.  */
3770 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3772 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
/* For destinations other than the exit block, subtract this edge's
   count and frequency from the destination, clamping at zero.  */
3774 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3776 e->dest->count -= e->count;
3777 e->dest->frequency -= EDGE_FREQUENCY (e);
3778 if (e->dest->count < 0)
3779 e->dest->count = 0;
3780 if (e->dest->frequency < 0)
3781 e->dest->frequency = 0;
3783 count += e->count;
3784 probability += e->probability;
3785 remove_edge (e);
3787 else
3788 ei_next (&ei);
3791 /* This is somewhat ugly: the call_expr expander often emits instructions
3792 after the sibcall (to perform the function return). These confuse the
3793 find_many_sub_basic_blocks code, so we need to get rid of these. */
/* LAST is the sibcall insn here; the insn after it is asserted to be a
   barrier.  */
3794 last = NEXT_INSN (last);
3795 gcc_assert (BARRIER_P (last));
/* Delete what follows the barrier, stopping at the first label.  */
3797 *can_fallthru = false;
3798 while (NEXT_INSN (last))
3800 /* For instance an sqrt builtin expander expands if with
3801 sibcall in the then and label for `else`. */
3802 if (LABEL_P (NEXT_INSN (last)))
3804 *can_fallthru = true;
3805 break;
3807 delete_insn (NEXT_INSN (last));
/* Give BB an abnormal sibcall edge to the exit block that carries the
   totals of the edges removed above, and end BB at the barrier.  */
3810 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3811 | EDGE_SIBCALL);
3812 e->probability += probability;
3813 e->count += count;
3814 BB_END (bb) = last;
3815 update_bb_for_insn (bb);
/* Insns remaining after the barrier (the label case above) go into a
   new basic block; a trailing barrier is excluded from that block.  */
3817 if (NEXT_INSN (last))
3819 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3821 last = BB_END (bb);
3822 if (BARRIER_P (last))
3823 BB_END (bb) = PREV_INSN (last);
3826 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3828 return bb;
3831 /* Return the difference between the floor and the truncated result of
3832 a signed division by OP1 with remainder MOD. */
3833 static rtx
3834 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3836 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3837 return gen_rtx_IF_THEN_ELSE
3838 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3839 gen_rtx_IF_THEN_ELSE
3840 (mode, gen_rtx_LT (BImode,
3841 gen_rtx_DIV (mode, op1, mod),
3842 const0_rtx),
3843 constm1_rtx, const0_rtx),
3844 const0_rtx);
3847 /* Return the difference between the ceil and the truncated result of
3848 a signed division by OP1 with remainder MOD. */
3849 static rtx
3850 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3852 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3853 return gen_rtx_IF_THEN_ELSE
3854 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3855 gen_rtx_IF_THEN_ELSE
3856 (mode, gen_rtx_GT (BImode,
3857 gen_rtx_DIV (mode, op1, mod),
3858 const0_rtx),
3859 const1_rtx, const0_rtx),
3860 const0_rtx);
3863 /* Return the difference between the ceil and the truncated result of
3864 an unsigned division by OP1 with remainder MOD. */
3865 static rtx
3866 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3868 /* (mod != 0 ? 1 : 0) */
3869 return gen_rtx_IF_THEN_ELSE
3870 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3871 const1_rtx, const0_rtx);
3874 /* Return the difference between the rounded and the truncated result
3875 of a signed division by OP1 with remainder MOD. Halfway cases are
3876 rounded away from zero, rather than to the nearest even number. */
3877 static rtx
3878 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3880 /* (abs (mod) >= abs (op1) - abs (mod)
3881 ? (op1 / mod > 0 ? 1 : -1)
3882 : 0) */
3883 return gen_rtx_IF_THEN_ELSE
3884 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3885 gen_rtx_MINUS (mode,
3886 gen_rtx_ABS (mode, op1),
3887 gen_rtx_ABS (mode, mod))),
3888 gen_rtx_IF_THEN_ELSE
3889 (mode, gen_rtx_GT (BImode,
3890 gen_rtx_DIV (mode, op1, mod),
3891 const0_rtx),
3892 const1_rtx, constm1_rtx),
3893 const0_rtx);
3896 /* Return the difference between the rounded and the truncated result
3897 of a unsigned division by OP1 with remainder MOD. Halfway cases
3898 are rounded away from zero, rather than to the nearest even
3899 number. */
3900 static rtx
3901 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
3903 /* (mod >= op1 - mod ? 1 : 0) */
3904 return gen_rtx_IF_THEN_ELSE
3905 (mode, gen_rtx_GE (BImode, mod,
3906 gen_rtx_MINUS (mode, op1, mod)),
3907 const1_rtx, const0_rtx);
3910 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3911 any rtl. */
/* AS is the address space the address belongs to.  Which body is
   compiled depends on whether POINTERS_EXTEND_UNSIGNED is defined.
   When it is not defined, the function only asserts that MODE and the
   mode of X are acceptable and returns X unchanged.  When it is
   defined, the result is X itself, a converted expression, or NULL
   when the required pointer extension cannot be expressed.  */
3913 static rtx
3914 convert_debug_memory_address (machine_mode mode, rtx x,
3915 addr_space_t as)
3917 machine_mode xmode = GET_MODE (x);
3919 #ifndef POINTERS_EXTEND_UNSIGNED
/* Without pointer extension, X must already be in MODE or be
   VOIDmode.  */
3920 gcc_assert (mode == Pmode
3921 || mode == targetm.addr_space.address_mode (as));
3922 gcc_assert (xmode == mode || xmode == VOIDmode);
3923 #else
3924 rtx temp;
3926 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
/* Nothing to convert when X already has MODE or has no mode.  */
3928 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3929 return x;
/* Narrowing takes the low part; widening uses ZERO_EXTEND when
   POINTERS_EXTEND_UNSIGNED is positive and SIGN_EXTEND when it is zero.
   The final `else' handles the remaining (negative) value, for which
   only the specific shapes of X below can be converted.  */
3931 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3932 x = lowpart_subreg (mode, x, xmode);
3933 else if (POINTERS_EXTEND_UNSIGNED > 0)
3934 x = gen_rtx_ZERO_EXTEND (mode, x);
3935 else if (!POINTERS_EXTEND_UNSIGNED)
3936 x = gen_rtx_SIGN_EXTEND (mode, x);
3937 else
3939 switch (GET_CODE (x))
3941 case SUBREG:
/* A SUBREG of a promoted variable, of a pointer register, or of a
   pointer register plus a constant is replaced by its inner expression
   when that expression already has MODE.  */
3942 if ((SUBREG_PROMOTED_VAR_P (x)
3943 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3944 || (GET_CODE (SUBREG_REG (x)) == PLUS
3945 && REG_P (XEXP (SUBREG_REG (x), 0))
3946 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
3947 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
3948 && GET_MODE (SUBREG_REG (x)) == mode)
3949 return SUBREG_REG (x);
3950 break;
3951 case LABEL_REF:
/* Rebuild the label reference in MODE, keeping its nonlocal flag.  */
3952 temp = gen_rtx_LABEL_REF (mode, LABEL_REF_LABEL (x));
3953 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
3954 return temp;
3955 case SYMBOL_REF:
/* Change the mode on a shallow copy so that X itself is untouched.  */
3956 temp = shallow_copy_rtx (x);
3957 PUT_MODE (temp, mode);
3958 return temp;
3959 case CONST:
/* Convert the wrapped expression recursively; a NULL result is
   returned as is.  */
3960 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3961 if (temp)
3962 temp = gen_rtx_CONST (mode, temp);
3963 return temp;
3964 case PLUS:
3965 case MINUS:
/* Only a constant second operand is handled: the first operand is
   converted recursively and the operation is rebuilt in MODE.  */
3966 if (CONST_INT_P (XEXP (x, 1)))
3968 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3969 if (temp)
3970 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
3972 break;
3973 default:
3974 break;
3976 /* Don't know how to express ptr_extend as operation in debug info. */
3977 return NULL;
3979 #endif /* POINTERS_EXTEND_UNSIGNED */
3981 return x;
3984 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
3985 by avoid_deep_ter_for_debug. */
3987 static hash_map<tree, tree> *deep_ter_debug_map;
3989 /* Split too deep TER chains for debug stmts using debug temporaries. */
3991 static void
3992 avoid_deep_ter_for_debug (gimple *stmt, int depth)
3994 use_operand_p use_p;
3995 ssa_op_iter iter;
3996 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
3998 tree use = USE_FROM_PTR (use_p);
3999 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4000 continue;
4001 gimple *g = get_gimple_for_ssa_name (use);
4002 if (g == NULL)
4003 continue;
4004 if (depth > 6 && !stmt_ends_bb_p (g))
4006 if (deep_ter_debug_map == NULL)
4007 deep_ter_debug_map = new hash_map<tree, tree>;
4009 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4010 if (vexpr != NULL)
4011 continue;
4012 vexpr = make_node (DEBUG_EXPR_DECL);
4013 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4014 DECL_ARTIFICIAL (vexpr) = 1;
4015 TREE_TYPE (vexpr) = TREE_TYPE (use);
4016 DECL_MODE (vexpr) = TYPE_MODE (TREE_TYPE (use));
4017 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4018 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4019 avoid_deep_ter_for_debug (def_temp, 0);
4021 else
4022 avoid_deep_ter_for_debug (g, depth + 1);
4026 /* Return an RTX equivalent to the value of the parameter DECL. */
4028 static rtx
4029 expand_debug_parm_decl (tree decl)
4031 rtx incoming = DECL_INCOMING_RTL (decl);
4033 if (incoming
4034 && GET_MODE (incoming) != BLKmode
4035 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4036 || (MEM_P (incoming)
4037 && REG_P (XEXP (incoming, 0))
4038 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4040 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4042 #ifdef HAVE_window_save
4043 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4044 If the target machine has an explicit window save instruction, the
4045 actual entry value is the corresponding OUTGOING_REGNO instead. */
4046 if (REG_P (incoming)
4047 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4048 incoming
4049 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4050 OUTGOING_REGNO (REGNO (incoming)), 0);
4051 else if (MEM_P (incoming))
4053 rtx reg = XEXP (incoming, 0);
4054 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4056 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4057 incoming = replace_equiv_address_nv (incoming, reg);
4059 else
4060 incoming = copy_rtx (incoming);
4062 #endif
4064 ENTRY_VALUE_EXP (rtl) = incoming;
4065 return rtl;
4068 if (incoming
4069 && GET_MODE (incoming) != BLKmode
4070 && !TREE_ADDRESSABLE (decl)
4071 && MEM_P (incoming)
4072 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4073 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4074 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4075 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4076 return copy_rtx (incoming);
4078 return NULL_RTX;
4081 /* Return an RTX equivalent to the value of the tree expression EXP. */
4083 static rtx
4084 expand_debug_expr (tree exp)
4086 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4087 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4088 machine_mode inner_mode = VOIDmode;
4089 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4090 addr_space_t as;
4092 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4094 case tcc_expression:
4095 switch (TREE_CODE (exp))
4097 case COND_EXPR:
4098 case DOT_PROD_EXPR:
4099 case SAD_EXPR:
4100 case WIDEN_MULT_PLUS_EXPR:
4101 case WIDEN_MULT_MINUS_EXPR:
4102 case FMA_EXPR:
4103 goto ternary;
4105 case TRUTH_ANDIF_EXPR:
4106 case TRUTH_ORIF_EXPR:
4107 case TRUTH_AND_EXPR:
4108 case TRUTH_OR_EXPR:
4109 case TRUTH_XOR_EXPR:
4110 goto binary;
4112 case TRUTH_NOT_EXPR:
4113 goto unary;
4115 default:
4116 break;
4118 break;
4120 ternary:
4121 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4122 if (!op2)
4123 return NULL_RTX;
4124 /* Fall through. */
4126 binary:
4127 case tcc_binary:
4128 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4129 if (!op1)
4130 return NULL_RTX;
4131 switch (TREE_CODE (exp))
4133 case LSHIFT_EXPR:
4134 case RSHIFT_EXPR:
4135 case LROTATE_EXPR:
4136 case RROTATE_EXPR:
4137 case WIDEN_LSHIFT_EXPR:
4138 /* Ensure second operand isn't wider than the first one. */
4139 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4140 if (SCALAR_INT_MODE_P (inner_mode))
4142 machine_mode opmode = mode;
4143 if (VECTOR_MODE_P (mode))
4144 opmode = GET_MODE_INNER (mode);
4145 if (SCALAR_INT_MODE_P (opmode)
4146 && (GET_MODE_PRECISION (opmode)
4147 < GET_MODE_PRECISION (inner_mode)))
4148 op1 = lowpart_subreg (opmode, op1, inner_mode);
4150 break;
4151 default:
4152 break;
4154 /* Fall through. */
4156 unary:
4157 case tcc_unary:
4158 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4159 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4160 if (!op0)
4161 return NULL_RTX;
4162 break;
4164 case tcc_comparison:
4165 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4166 goto binary;
4168 case tcc_type:
4169 case tcc_statement:
4170 gcc_unreachable ();
4172 case tcc_constant:
4173 case tcc_exceptional:
4174 case tcc_declaration:
4175 case tcc_reference:
4176 case tcc_vl_exp:
4177 break;
4180 switch (TREE_CODE (exp))
4182 case STRING_CST:
4183 if (!lookup_constant_def (exp))
4185 if (strlen (TREE_STRING_POINTER (exp)) + 1
4186 != (size_t) TREE_STRING_LENGTH (exp))
4187 return NULL_RTX;
4188 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4189 op0 = gen_rtx_MEM (BLKmode, op0);
4190 set_mem_attributes (op0, exp, 0);
4191 return op0;
4193 /* Fall through... */
4195 case INTEGER_CST:
4196 case REAL_CST:
4197 case FIXED_CST:
4198 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4199 return op0;
4201 case COMPLEX_CST:
4202 gcc_assert (COMPLEX_MODE_P (mode));
4203 op0 = expand_debug_expr (TREE_REALPART (exp));
4204 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4205 return gen_rtx_CONCAT (mode, op0, op1);
4207 case DEBUG_EXPR_DECL:
4208 op0 = DECL_RTL_IF_SET (exp);
4210 if (op0)
4211 return op0;
4213 op0 = gen_rtx_DEBUG_EXPR (mode);
4214 DEBUG_EXPR_TREE_DECL (op0) = exp;
4215 SET_DECL_RTL (exp, op0);
4217 return op0;
4219 case VAR_DECL:
4220 case PARM_DECL:
4221 case FUNCTION_DECL:
4222 case LABEL_DECL:
4223 case CONST_DECL:
4224 case RESULT_DECL:
4225 op0 = DECL_RTL_IF_SET (exp);
4227 /* This decl was probably optimized away. */
4228 if (!op0)
4230 if (TREE_CODE (exp) != VAR_DECL
4231 || DECL_EXTERNAL (exp)
4232 || !TREE_STATIC (exp)
4233 || !DECL_NAME (exp)
4234 || DECL_HARD_REGISTER (exp)
4235 || DECL_IN_CONSTANT_POOL (exp)
4236 || mode == VOIDmode)
4237 return NULL;
4239 op0 = make_decl_rtl_for_debug (exp);
4240 if (!MEM_P (op0)
4241 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4242 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4243 return NULL;
4245 else
4246 op0 = copy_rtx (op0);
4248 if (GET_MODE (op0) == BLKmode
4249 /* If op0 is not BLKmode, but mode is, adjust_mode
4250 below would ICE. While it is likely a FE bug,
4251 try to be robust here. See PR43166. */
4252 || mode == BLKmode
4253 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4255 gcc_assert (MEM_P (op0));
4256 op0 = adjust_address_nv (op0, mode, 0);
4257 return op0;
4260 /* Fall through. */
4262 adjust_mode:
4263 case PAREN_EXPR:
4264 CASE_CONVERT:
4266 inner_mode = GET_MODE (op0);
4268 if (mode == inner_mode)
4269 return op0;
4271 if (inner_mode == VOIDmode)
4273 if (TREE_CODE (exp) == SSA_NAME)
4274 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4275 else
4276 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4277 if (mode == inner_mode)
4278 return op0;
4281 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4283 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
4284 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4285 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
4286 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4287 else
4288 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4290 else if (FLOAT_MODE_P (mode))
4292 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4293 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4294 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4295 else
4296 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4298 else if (FLOAT_MODE_P (inner_mode))
4300 if (unsignedp)
4301 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4302 else
4303 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4305 else if (CONSTANT_P (op0)
4306 || GET_MODE_PRECISION (mode) <= GET_MODE_PRECISION (inner_mode))
4307 op0 = lowpart_subreg (mode, op0, inner_mode);
4308 else if (UNARY_CLASS_P (exp)
4309 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4310 : unsignedp)
4311 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4312 else
4313 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4315 return op0;
4318 case MEM_REF:
4319 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4321 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4322 TREE_OPERAND (exp, 0),
4323 TREE_OPERAND (exp, 1));
4324 if (newexp)
4325 return expand_debug_expr (newexp);
4327 /* FALLTHROUGH */
4328 case INDIRECT_REF:
4329 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4330 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4331 if (!op0)
4332 return NULL;
4334 if (TREE_CODE (exp) == MEM_REF)
4336 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4337 || (GET_CODE (op0) == PLUS
4338 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4339 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4340 Instead just use get_inner_reference. */
4341 goto component_ref;
4343 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4344 if (!op1 || !CONST_INT_P (op1))
4345 return NULL;
4347 op0 = plus_constant (inner_mode, op0, INTVAL (op1));
4350 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4352 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4353 op0, as);
4354 if (op0 == NULL_RTX)
4355 return NULL;
4357 op0 = gen_rtx_MEM (mode, op0);
4358 set_mem_attributes (op0, exp, 0);
4359 if (TREE_CODE (exp) == MEM_REF
4360 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4361 set_mem_expr (op0, NULL_TREE);
4362 set_mem_addr_space (op0, as);
4364 return op0;
4366 case TARGET_MEM_REF:
4367 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4368 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4369 return NULL;
4371 op0 = expand_debug_expr
4372 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4373 if (!op0)
4374 return NULL;
4376 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4377 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4378 op0, as);
4379 if (op0 == NULL_RTX)
4380 return NULL;
4382 op0 = gen_rtx_MEM (mode, op0);
4384 set_mem_attributes (op0, exp, 0);
4385 set_mem_addr_space (op0, as);
4387 return op0;
4389 component_ref:
4390 case ARRAY_REF:
4391 case ARRAY_RANGE_REF:
4392 case COMPONENT_REF:
4393 case BIT_FIELD_REF:
4394 case REALPART_EXPR:
4395 case IMAGPART_EXPR:
4396 case VIEW_CONVERT_EXPR:
4398 machine_mode mode1;
4399 HOST_WIDE_INT bitsize, bitpos;
4400 tree offset;
4401 int volatilep = 0;
4402 tree tem = get_inner_reference (exp, &bitsize, &bitpos, &offset,
4403 &mode1, &unsignedp, &volatilep, false);
4404 rtx orig_op0;
4406 if (bitsize == 0)
4407 return NULL;
4409 orig_op0 = op0 = expand_debug_expr (tem);
4411 if (!op0)
4412 return NULL;
4414 if (offset)
4416 machine_mode addrmode, offmode;
4418 if (!MEM_P (op0))
4419 return NULL;
4421 op0 = XEXP (op0, 0);
4422 addrmode = GET_MODE (op0);
4423 if (addrmode == VOIDmode)
4424 addrmode = Pmode;
4426 op1 = expand_debug_expr (offset);
4427 if (!op1)
4428 return NULL;
4430 offmode = GET_MODE (op1);
4431 if (offmode == VOIDmode)
4432 offmode = TYPE_MODE (TREE_TYPE (offset));
4434 if (addrmode != offmode)
4435 op1 = lowpart_subreg (addrmode, op1, offmode);
4437 /* Don't use offset_address here, we don't need a
4438 recognizable address, and we don't want to generate
4439 code. */
4440 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4441 op0, op1));
4444 if (MEM_P (op0))
4446 if (mode1 == VOIDmode)
4447 /* Bitfield. */
4448 mode1 = smallest_mode_for_size (bitsize, MODE_INT);
4449 if (bitpos >= BITS_PER_UNIT)
4451 op0 = adjust_address_nv (op0, mode1, bitpos / BITS_PER_UNIT);
4452 bitpos %= BITS_PER_UNIT;
4454 else if (bitpos < 0)
4456 HOST_WIDE_INT units
4457 = (-bitpos + BITS_PER_UNIT - 1) / BITS_PER_UNIT;
4458 op0 = adjust_address_nv (op0, mode1, units);
4459 bitpos += units * BITS_PER_UNIT;
4461 else if (bitpos == 0 && bitsize == GET_MODE_BITSIZE (mode))
4462 op0 = adjust_address_nv (op0, mode, 0);
4463 else if (GET_MODE (op0) != mode1)
4464 op0 = adjust_address_nv (op0, mode1, 0);
4465 else
4466 op0 = copy_rtx (op0);
4467 if (op0 == orig_op0)
4468 op0 = shallow_copy_rtx (op0);
4469 set_mem_attributes (op0, exp, 0);
4472 if (bitpos == 0 && mode == GET_MODE (op0))
4473 return op0;
4475 if (bitpos < 0)
4476 return NULL;
4478 if (GET_MODE (op0) == BLKmode)
4479 return NULL;
4481 if ((bitpos % BITS_PER_UNIT) == 0
4482 && bitsize == GET_MODE_BITSIZE (mode1))
4484 machine_mode opmode = GET_MODE (op0);
4486 if (opmode == VOIDmode)
4487 opmode = TYPE_MODE (TREE_TYPE (tem));
4489 /* This condition may hold if we're expanding the address
4490 right past the end of an array that turned out not to
4491 be addressable (i.e., the address was only computed in
4492 debug stmts). The gen_subreg below would rightfully
4493 crash, and the address doesn't really exist, so just
4494 drop it. */
4495 if (bitpos >= GET_MODE_BITSIZE (opmode))
4496 return NULL;
4498 if ((bitpos % GET_MODE_BITSIZE (mode)) == 0)
4499 return simplify_gen_subreg (mode, op0, opmode,
4500 bitpos / BITS_PER_UNIT);
4503 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4504 && TYPE_UNSIGNED (TREE_TYPE (exp))
4505 ? SIGN_EXTRACT
4506 : ZERO_EXTRACT, mode,
4507 GET_MODE (op0) != VOIDmode
4508 ? GET_MODE (op0)
4509 : TYPE_MODE (TREE_TYPE (tem)),
4510 op0, GEN_INT (bitsize), GEN_INT (bitpos));
4513 case ABS_EXPR:
4514 return simplify_gen_unary (ABS, mode, op0, mode);
4516 case NEGATE_EXPR:
4517 return simplify_gen_unary (NEG, mode, op0, mode);
4519 case BIT_NOT_EXPR:
4520 return simplify_gen_unary (NOT, mode, op0, mode);
4522 case FLOAT_EXPR:
4523 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4524 0)))
4525 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4526 inner_mode);
4528 case FIX_TRUNC_EXPR:
4529 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4530 inner_mode);
4532 case POINTER_PLUS_EXPR:
4533 /* For the rare target where pointers are not the same size as
4534 size_t, we need to check for mis-matched modes and correct
4535 the addend. */
4536 if (op0 && op1
4537 && GET_MODE (op0) != VOIDmode && GET_MODE (op1) != VOIDmode
4538 && GET_MODE (op0) != GET_MODE (op1))
4540 if (GET_MODE_BITSIZE (GET_MODE (op0)) < GET_MODE_BITSIZE (GET_MODE (op1))
4541 /* If OP0 is a partial mode, then we must truncate, even if it has
4542 the same bitsize as OP1 as GCC's representation of partial modes
4543 is opaque. */
4544 || (GET_MODE_CLASS (GET_MODE (op0)) == MODE_PARTIAL_INT
4545 && GET_MODE_BITSIZE (GET_MODE (op0)) == GET_MODE_BITSIZE (GET_MODE (op1))))
4546 op1 = simplify_gen_unary (TRUNCATE, GET_MODE (op0), op1,
4547 GET_MODE (op1));
4548 else
4549 /* We always sign-extend, regardless of the signedness of
4550 the operand, because the operand is always unsigned
4551 here even if the original C expression is signed. */
4552 op1 = simplify_gen_unary (SIGN_EXTEND, GET_MODE (op0), op1,
4553 GET_MODE (op1));
4555 /* Fall through. */
4556 case PLUS_EXPR:
4557 return simplify_gen_binary (PLUS, mode, op0, op1);
4559 case MINUS_EXPR:
4560 return simplify_gen_binary (MINUS, mode, op0, op1);
4562 case MULT_EXPR:
4563 return simplify_gen_binary (MULT, mode, op0, op1);
4565 case RDIV_EXPR:
4566 case TRUNC_DIV_EXPR:
4567 case EXACT_DIV_EXPR:
4568 if (unsignedp)
4569 return simplify_gen_binary (UDIV, mode, op0, op1);
4570 else
4571 return simplify_gen_binary (DIV, mode, op0, op1);
4573 case TRUNC_MOD_EXPR:
4574 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4576 case FLOOR_DIV_EXPR:
4577 if (unsignedp)
4578 return simplify_gen_binary (UDIV, mode, op0, op1);
4579 else
4581 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4582 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4583 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4584 return simplify_gen_binary (PLUS, mode, div, adj);
4587 case FLOOR_MOD_EXPR:
4588 if (unsignedp)
4589 return simplify_gen_binary (UMOD, mode, op0, op1);
4590 else
4592 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4593 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4594 adj = simplify_gen_unary (NEG, mode,
4595 simplify_gen_binary (MULT, mode, adj, op1),
4596 mode);
4597 return simplify_gen_binary (PLUS, mode, mod, adj);
4600 case CEIL_DIV_EXPR:
4601 if (unsignedp)
4603 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4604 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4605 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4606 return simplify_gen_binary (PLUS, mode, div, adj);
4608 else
4610 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4611 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4612 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4613 return simplify_gen_binary (PLUS, mode, div, adj);
4616 case CEIL_MOD_EXPR:
4617 if (unsignedp)
4619 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4620 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4621 adj = simplify_gen_unary (NEG, mode,
4622 simplify_gen_binary (MULT, mode, adj, op1),
4623 mode);
4624 return simplify_gen_binary (PLUS, mode, mod, adj);
4626 else
4628 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4629 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4630 adj = simplify_gen_unary (NEG, mode,
4631 simplify_gen_binary (MULT, mode, adj, op1),
4632 mode);
4633 return simplify_gen_binary (PLUS, mode, mod, adj);
4636 case ROUND_DIV_EXPR:
4637 if (unsignedp)
4639 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4640 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4641 rtx adj = round_udiv_adjust (mode, mod, op1);
4642 return simplify_gen_binary (PLUS, mode, div, adj);
4644 else
4646 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4647 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4648 rtx adj = round_sdiv_adjust (mode, mod, op1);
4649 return simplify_gen_binary (PLUS, mode, div, adj);
4652 case ROUND_MOD_EXPR:
4653 if (unsignedp)
4655 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4656 rtx adj = round_udiv_adjust (mode, mod, op1);
4657 adj = simplify_gen_unary (NEG, mode,
4658 simplify_gen_binary (MULT, mode, adj, op1),
4659 mode);
4660 return simplify_gen_binary (PLUS, mode, mod, adj);
4662 else
4664 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4665 rtx adj = round_sdiv_adjust (mode, mod, op1);
4666 adj = simplify_gen_unary (NEG, mode,
4667 simplify_gen_binary (MULT, mode, adj, op1),
4668 mode);
4669 return simplify_gen_binary (PLUS, mode, mod, adj);
4672 case LSHIFT_EXPR:
4673 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4675 case RSHIFT_EXPR:
4676 if (unsignedp)
4677 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4678 else
4679 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4681 case LROTATE_EXPR:
4682 return simplify_gen_binary (ROTATE, mode, op0, op1);
4684 case RROTATE_EXPR:
4685 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4687 case MIN_EXPR:
4688 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4690 case MAX_EXPR:
4691 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4693 case BIT_AND_EXPR:
4694 case TRUTH_AND_EXPR:
4695 return simplify_gen_binary (AND, mode, op0, op1);
4697 case BIT_IOR_EXPR:
4698 case TRUTH_OR_EXPR:
4699 return simplify_gen_binary (IOR, mode, op0, op1);
4701 case BIT_XOR_EXPR:
4702 case TRUTH_XOR_EXPR:
4703 return simplify_gen_binary (XOR, mode, op0, op1);
4705 case TRUTH_ANDIF_EXPR:
4706 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4708 case TRUTH_ORIF_EXPR:
4709 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4711 case TRUTH_NOT_EXPR:
4712 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4714 case LT_EXPR:
4715 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4716 op0, op1);
4718 case LE_EXPR:
4719 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4720 op0, op1);
4722 case GT_EXPR:
4723 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4724 op0, op1);
4726 case GE_EXPR:
4727 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4728 op0, op1);
4730 case EQ_EXPR:
4731 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4733 case NE_EXPR:
4734 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4736 case UNORDERED_EXPR:
4737 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4739 case ORDERED_EXPR:
4740 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4742 case UNLT_EXPR:
4743 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4745 case UNLE_EXPR:
4746 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4748 case UNGT_EXPR:
4749 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4751 case UNGE_EXPR:
4752 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4754 case UNEQ_EXPR:
4755 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4757 case LTGT_EXPR:
4758 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4760 case COND_EXPR:
4761 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4763 case COMPLEX_EXPR:
4764 gcc_assert (COMPLEX_MODE_P (mode));
4765 if (GET_MODE (op0) == VOIDmode)
4766 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4767 if (GET_MODE (op1) == VOIDmode)
4768 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4769 return gen_rtx_CONCAT (mode, op0, op1);
4771 case CONJ_EXPR:
4772 if (GET_CODE (op0) == CONCAT)
4773 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4774 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4775 XEXP (op0, 1),
4776 GET_MODE_INNER (mode)));
4777 else
4779 machine_mode imode = GET_MODE_INNER (mode);
4780 rtx re, im;
4782 if (MEM_P (op0))
4784 re = adjust_address_nv (op0, imode, 0);
4785 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4787 else
4789 machine_mode ifmode = int_mode_for_mode (mode);
4790 machine_mode ihmode = int_mode_for_mode (imode);
4791 rtx halfsize;
4792 if (ifmode == BLKmode || ihmode == BLKmode)
4793 return NULL;
4794 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4795 re = op0;
4796 if (mode != ifmode)
4797 re = gen_rtx_SUBREG (ifmode, re, 0);
4798 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4799 if (imode != ihmode)
4800 re = gen_rtx_SUBREG (imode, re, 0);
4801 im = copy_rtx (op0);
4802 if (mode != ifmode)
4803 im = gen_rtx_SUBREG (ifmode, im, 0);
4804 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4805 if (imode != ihmode)
4806 im = gen_rtx_SUBREG (imode, im, 0);
4808 im = gen_rtx_NEG (imode, im);
4809 return gen_rtx_CONCAT (mode, re, im);
4812 case ADDR_EXPR:
4813 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4814 if (!op0 || !MEM_P (op0))
4816 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4817 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4818 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4819 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4820 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4821 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4823 if (handled_component_p (TREE_OPERAND (exp, 0)))
4825 HOST_WIDE_INT bitoffset, bitsize, maxsize;
4826 tree decl
4827 = get_ref_base_and_extent (TREE_OPERAND (exp, 0),
4828 &bitoffset, &bitsize, &maxsize);
4829 if ((TREE_CODE (decl) == VAR_DECL
4830 || TREE_CODE (decl) == PARM_DECL
4831 || TREE_CODE (decl) == RESULT_DECL)
4832 && (!TREE_ADDRESSABLE (decl)
4833 || target_for_debug_bind (decl))
4834 && (bitoffset % BITS_PER_UNIT) == 0
4835 && bitsize > 0
4836 && bitsize == maxsize)
4838 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4839 return plus_constant (mode, base, bitoffset / BITS_PER_UNIT);
4843 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4844 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4845 == ADDR_EXPR)
4847 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4848 0));
4849 if (op0 != NULL
4850 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4851 || (GET_CODE (op0) == PLUS
4852 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4853 && CONST_INT_P (XEXP (op0, 1)))))
4855 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4856 1));
4857 if (!op1 || !CONST_INT_P (op1))
4858 return NULL;
4860 return plus_constant (mode, op0, INTVAL (op1));
4864 return NULL;
4867 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4868 op0 = convert_debug_memory_address (mode, XEXP (op0, 0), as);
4870 return op0;
4872 case VECTOR_CST:
4874 unsigned i;
4876 op0 = gen_rtx_CONCATN
4877 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4879 for (i = 0; i < VECTOR_CST_NELTS (exp); ++i)
4881 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4882 if (!op1)
4883 return NULL;
4884 XVECEXP (op0, 0, i) = op1;
4887 return op0;
4890 case CONSTRUCTOR:
4891 if (TREE_CLOBBER_P (exp))
4892 return NULL;
4893 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4895 unsigned i;
4896 tree val;
4898 op0 = gen_rtx_CONCATN
4899 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4901 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4903 op1 = expand_debug_expr (val);
4904 if (!op1)
4905 return NULL;
4906 XVECEXP (op0, 0, i) = op1;
4909 if (i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)))
4911 op1 = expand_debug_expr
4912 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4914 if (!op1)
4915 return NULL;
4917 for (; i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)); i++)
4918 XVECEXP (op0, 0, i) = op1;
4921 return op0;
4923 else
4924 goto flag_unsupported;
4926 case CALL_EXPR:
4927 /* ??? Maybe handle some builtins? */
4928 return NULL;
4930 case SSA_NAME:
4932 gimple *g = get_gimple_for_ssa_name (exp);
4933 if (g)
4935 tree t = NULL_TREE;
4936 if (deep_ter_debug_map)
4938 tree *slot = deep_ter_debug_map->get (exp);
4939 if (slot)
4940 t = *slot;
4942 if (t == NULL_TREE)
4943 t = gimple_assign_rhs_to_tree (g);
4944 op0 = expand_debug_expr (t);
4945 if (!op0)
4946 return NULL;
4948 else
4950 int part = var_to_partition (SA.map, exp);
4952 if (part == NO_PARTITION)
4954 /* If this is a reference to an incoming value of parameter
4955 that is never used in the code or where the incoming
4956 value is never used in the code, use PARM_DECL's
4957 DECL_RTL if set. */
4958 if (SSA_NAME_IS_DEFAULT_DEF (exp)
4959 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL)
4961 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
4962 if (op0)
4963 goto adjust_mode;
4964 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
4965 if (op0)
4966 goto adjust_mode;
4968 return NULL;
4971 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
4973 op0 = copy_rtx (SA.partition_to_pseudo[part]);
4975 goto adjust_mode;
4978 case ERROR_MARK:
4979 return NULL;
4981 /* Vector stuff. For most of the codes we don't have rtl codes. */
4982 case REALIGN_LOAD_EXPR:
4983 case REDUC_MAX_EXPR:
4984 case REDUC_MIN_EXPR:
4985 case REDUC_PLUS_EXPR:
4986 case VEC_COND_EXPR:
4987 case VEC_PACK_FIX_TRUNC_EXPR:
4988 case VEC_PACK_SAT_EXPR:
4989 case VEC_PACK_TRUNC_EXPR:
4990 case VEC_UNPACK_FLOAT_HI_EXPR:
4991 case VEC_UNPACK_FLOAT_LO_EXPR:
4992 case VEC_UNPACK_HI_EXPR:
4993 case VEC_UNPACK_LO_EXPR:
4994 case VEC_WIDEN_MULT_HI_EXPR:
4995 case VEC_WIDEN_MULT_LO_EXPR:
4996 case VEC_WIDEN_MULT_EVEN_EXPR:
4997 case VEC_WIDEN_MULT_ODD_EXPR:
4998 case VEC_WIDEN_LSHIFT_HI_EXPR:
4999 case VEC_WIDEN_LSHIFT_LO_EXPR:
5000 case VEC_PERM_EXPR:
5001 return NULL;
5003 /* Misc codes. */
5004 case ADDR_SPACE_CONVERT_EXPR:
5005 case FIXED_CONVERT_EXPR:
5006 case OBJ_TYPE_REF:
5007 case WITH_SIZE_EXPR:
5008 return NULL;
5010 case DOT_PROD_EXPR:
5011 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5012 && SCALAR_INT_MODE_P (mode))
5015 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5016 0)))
5017 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5018 inner_mode);
5020 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5021 1)))
5022 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5023 inner_mode);
5024 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5025 return simplify_gen_binary (PLUS, mode, op0, op2);
5027 return NULL;
5029 case WIDEN_MULT_EXPR:
5030 case WIDEN_MULT_PLUS_EXPR:
5031 case WIDEN_MULT_MINUS_EXPR:
5032 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5033 && SCALAR_INT_MODE_P (mode))
5035 inner_mode = GET_MODE (op0);
5036 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5037 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5038 else
5039 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5040 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5041 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5042 else
5043 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5044 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5045 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5046 return op0;
5047 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5048 return simplify_gen_binary (PLUS, mode, op0, op2);
5049 else
5050 return simplify_gen_binary (MINUS, mode, op2, op0);
5052 return NULL;
5054 case MULT_HIGHPART_EXPR:
5055 /* ??? Similar to the above. */
5056 return NULL;
5058 case WIDEN_SUM_EXPR:
5059 case WIDEN_LSHIFT_EXPR:
5060 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5061 && SCALAR_INT_MODE_P (mode))
5064 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5065 0)))
5066 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5067 inner_mode);
5068 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5069 ? ASHIFT : PLUS, mode, op0, op1);
5071 return NULL;
5073 case FMA_EXPR:
5074 return simplify_gen_ternary (FMA, mode, inner_mode, op0, op1, op2);
5076 default:
5077 flag_unsupported:
5078 #ifdef ENABLE_CHECKING
5079 debug_tree (exp);
5080 gcc_unreachable ();
5081 #else
5082 return NULL;
5083 #endif
5087 /* Return an RTX equivalent to the source bind value of the tree expression
5088 EXP. */
5090 static rtx
5091 expand_debug_source_expr (tree exp)
5093 rtx op0 = NULL_RTX;
5094 machine_mode mode = VOIDmode, inner_mode;
5096 switch (TREE_CODE (exp))
5098 case PARM_DECL:
5100 mode = DECL_MODE (exp);
5101 op0 = expand_debug_parm_decl (exp);
5102 if (op0)
5103 break;
5104 /* See if this isn't an argument that has been completely
5105 optimized out. */
5106 if (!DECL_RTL_SET_P (exp)
5107 && !DECL_INCOMING_RTL (exp)
5108 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5110 tree aexp = DECL_ORIGIN (exp);
5111 if (DECL_CONTEXT (aexp)
5112 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5114 vec<tree, va_gc> **debug_args;
5115 unsigned int ix;
5116 tree ddecl;
5117 debug_args = decl_debug_args_lookup (current_function_decl);
5118 if (debug_args != NULL)
5120 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5121 ix += 2)
5122 if (ddecl == aexp)
5123 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5127 break;
5129 default:
5130 break;
5133 if (op0 == NULL_RTX)
5134 return NULL_RTX;
5136 inner_mode = GET_MODE (op0);
5137 if (mode == inner_mode)
5138 return op0;
5140 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5142 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
5143 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5144 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
5145 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5146 else
5147 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5149 else if (FLOAT_MODE_P (mode))
5150 gcc_unreachable ();
5151 else if (FLOAT_MODE_P (inner_mode))
5153 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5154 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5155 else
5156 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5158 else if (CONSTANT_P (op0)
5159 || GET_MODE_BITSIZE (mode) <= GET_MODE_BITSIZE (inner_mode))
5160 op0 = lowpart_subreg (mode, op0, inner_mode);
5161 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5162 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5163 else
5164 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5166 return op0;
5169 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5170 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5171 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5173 static void
5174 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5176 rtx exp = *exp_p;
5178 if (exp == NULL_RTX)
5179 return;
5181 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5182 return;
5184 if (depth == 4)
5186 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5187 rtx dval = make_debug_expr_from_rtl (exp);
5189 /* Emit a debug bind insn before INSN. */
5190 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5191 DEBUG_EXPR_TREE_DECL (dval), exp,
5192 VAR_INIT_STATUS_INITIALIZED);
5194 emit_debug_insn_before (bind, insn);
5195 *exp_p = dval;
5196 return;
5199 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5200 int i, j;
5201 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5202 switch (*format_ptr++)
5204 case 'e':
5205 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5206 break;
5208 case 'E':
5209 case 'V':
5210 for (j = 0; j < XVECLEN (exp, i); j++)
5211 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5212 break;
5214 default:
5215 break;
5219 /* Expand the _LOCs in debug insns. We run this after expanding all
5220 regular insns, so that any variables referenced in the function
5221 will have their DECL_RTLs set. */
5223 static void
5224 expand_debug_locations (void)
5226 rtx_insn *insn;
5227 rtx_insn *last = get_last_insn ();
5228 int save_strict_alias = flag_strict_aliasing;
5230 /* New alias sets while setting up memory attributes cause
5231 -fcompare-debug failures, even though it doesn't bring about any
5232 codegen changes. */
5233 flag_strict_aliasing = 0;
5235 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5236 if (DEBUG_INSN_P (insn))
5238 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5239 rtx val;
5240 rtx_insn *prev_insn, *insn2;
5241 machine_mode mode;
5243 if (value == NULL_TREE)
5244 val = NULL_RTX;
5245 else
5247 if (INSN_VAR_LOCATION_STATUS (insn)
5248 == VAR_INIT_STATUS_UNINITIALIZED)
5249 val = expand_debug_source_expr (value);
5250 /* The avoid_deep_ter_for_debug function inserts
5251 debug bind stmts after SSA_NAME definition, with the
5252 SSA_NAME as the whole bind location. Disable temporarily
5253 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5254 being defined in this DEBUG_INSN. */
5255 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5257 tree *slot = deep_ter_debug_map->get (value);
5258 if (slot)
5260 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5261 *slot = NULL_TREE;
5262 else
5263 slot = NULL;
5265 val = expand_debug_expr (value);
5266 if (slot)
5267 *slot = INSN_VAR_LOCATION_DECL (insn);
5269 else
5270 val = expand_debug_expr (value);
5271 gcc_assert (last == get_last_insn ());
5274 if (!val)
5275 val = gen_rtx_UNKNOWN_VAR_LOC ();
5276 else
5278 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5280 gcc_assert (mode == GET_MODE (val)
5281 || (GET_MODE (val) == VOIDmode
5282 && (CONST_SCALAR_INT_P (val)
5283 || GET_CODE (val) == CONST_FIXED
5284 || GET_CODE (val) == LABEL_REF)));
5287 INSN_VAR_LOCATION_LOC (insn) = val;
5288 prev_insn = PREV_INSN (insn);
5289 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5290 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5293 flag_strict_aliasing = save_strict_alias;
5296 /* Performs swapping operands of commutative operations to expand
5297 the expensive one first. */
5299 static void
5300 reorder_operands (basic_block bb)
5302 unsigned int *lattice; /* Hold cost of each statement. */
5303 unsigned int i = 0, n = 0;
5304 gimple_stmt_iterator gsi;
5305 gimple_seq stmts;
5306 gimple *stmt;
5307 bool swap;
5308 tree op0, op1;
5309 ssa_op_iter iter;
5310 use_operand_p use_p;
5311 gimple *def0, *def1;
5313 /* Compute cost of each statement using estimate_num_insns. */
5314 stmts = bb_seq (bb);
5315 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5317 stmt = gsi_stmt (gsi);
5318 if (!is_gimple_debug (stmt))
5319 gimple_set_uid (stmt, n++);
5321 lattice = XNEWVEC (unsigned int, n);
5322 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5324 unsigned cost;
5325 stmt = gsi_stmt (gsi);
5326 if (is_gimple_debug (stmt))
5327 continue;
5328 cost = estimate_num_insns (stmt, &eni_size_weights);
5329 lattice[i] = cost;
5330 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5332 tree use = USE_FROM_PTR (use_p);
5333 gimple *def_stmt;
5334 if (TREE_CODE (use) != SSA_NAME)
5335 continue;
5336 def_stmt = get_gimple_for_ssa_name (use);
5337 if (!def_stmt)
5338 continue;
5339 lattice[i] += lattice[gimple_uid (def_stmt)];
5341 i++;
5342 if (!is_gimple_assign (stmt)
5343 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5344 continue;
5345 op0 = gimple_op (stmt, 1);
5346 op1 = gimple_op (stmt, 2);
5347 if (TREE_CODE (op0) != SSA_NAME
5348 || TREE_CODE (op1) != SSA_NAME)
5349 continue;
5350 /* Swap operands if the second one is more expensive. */
5351 def0 = get_gimple_for_ssa_name (op0);
5352 def1 = get_gimple_for_ssa_name (op1);
5353 if (!def1)
5354 continue;
5355 swap = false;
5356 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5357 swap = true;
5358 if (swap)
5360 if (dump_file && (dump_flags & TDF_DETAILS))
5362 fprintf (dump_file, "Swap operands in stmt:\n");
5363 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5364 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5365 def0 ? lattice[gimple_uid (def0)] : 0,
5366 lattice[gimple_uid (def1)]);
5368 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5369 gimple_assign_rhs2_ptr (stmt));
5372 XDELETE (lattice);
5375 /* Expand basic block BB from GIMPLE trees to RTL. */
5377 static basic_block
5378 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5380 gimple_stmt_iterator gsi;
5381 gimple_seq stmts;
5382 gimple *stmt = NULL;
5383 rtx_note *note;
5384 rtx_insn *last;
5385 edge e;
5386 edge_iterator ei;
5388 if (dump_file)
5389 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5390 bb->index);
5392 /* Note that since we are now transitioning from GIMPLE to RTL, we
5393 cannot use the gsi_*_bb() routines because they expect the basic
5394 block to be in GIMPLE, instead of RTL. Therefore, we need to
5395 access the BB sequence directly. */
5396 if (optimize)
5397 reorder_operands (bb);
5398 stmts = bb_seq (bb);
5399 bb->il.gimple.seq = NULL;
5400 bb->il.gimple.phi_nodes = NULL;
5401 rtl_profile_for_bb (bb);
5402 init_rtl_bb_info (bb);
5403 bb->flags |= BB_RTL;
5405 /* Remove the RETURN_EXPR if we may fall through to the exit
5406 instead. */
5407 gsi = gsi_last (stmts);
5408 if (!gsi_end_p (gsi)
5409 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5411 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5413 gcc_assert (single_succ_p (bb));
5414 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5416 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5417 && !gimple_return_retval (ret_stmt))
5419 gsi_remove (&gsi, false);
5420 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5424 gsi = gsi_start (stmts);
5425 if (!gsi_end_p (gsi))
5427 stmt = gsi_stmt (gsi);
5428 if (gimple_code (stmt) != GIMPLE_LABEL)
5429 stmt = NULL;
5432 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5434 if (stmt || elt)
5436 last = get_last_insn ();
5438 if (stmt)
5440 expand_gimple_stmt (stmt);
5441 gsi_next (&gsi);
5444 if (elt)
5445 emit_label (*elt);
5447 /* Java emits line number notes in the top of labels.
5448 ??? Make this go away once line number notes are obsoleted. */
5449 BB_HEAD (bb) = NEXT_INSN (last);
5450 if (NOTE_P (BB_HEAD (bb)))
5451 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5452 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5454 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5456 else
5457 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5459 NOTE_BASIC_BLOCK (note) = bb;
5461 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5463 basic_block new_bb;
5465 stmt = gsi_stmt (gsi);
5467 /* If this statement is a non-debug one, and we generate debug
5468 insns, then this one might be the last real use of a TERed
5469 SSA_NAME, but where there are still some debug uses further
5470 down. Expanding the current SSA name in such further debug
5471 uses by their RHS might lead to wrong debug info, as coalescing
5472 might make the operands of such RHS be placed into the same
5473 pseudo as something else. Like so:
5474 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5475 use(a_1);
5476 a_2 = ...
5477 #DEBUG ... => a_1
5478 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5479 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5480 the write to a_2 would actually have clobbered the place which
5481 formerly held a_0.
5483 So, instead of that, we recognize the situation, and generate
5484 debug temporaries at the last real use of TERed SSA names:
5485 a_1 = a_0 + 1;
5486 #DEBUG #D1 => a_1
5487 use(a_1);
5488 a_2 = ...
5489 #DEBUG ... => #D1
5491 if (MAY_HAVE_DEBUG_INSNS
5492 && SA.values
5493 && !is_gimple_debug (stmt))
5495 ssa_op_iter iter;
5496 tree op;
5497 gimple *def;
5499 location_t sloc = curr_insn_location ();
5501 /* Look for SSA names that have their last use here (TERed
5502 names always have only one real use). */
5503 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5504 if ((def = get_gimple_for_ssa_name (op)))
5506 imm_use_iterator imm_iter;
5507 use_operand_p use_p;
5508 bool have_debug_uses = false;
5510 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5512 if (gimple_debug_bind_p (USE_STMT (use_p)))
5514 have_debug_uses = true;
5515 break;
5519 if (have_debug_uses)
5521 /* OP is a TERed SSA name, with DEF its defining
5522 statement, and where OP is used in further debug
5523 instructions. Generate a debug temporary, and
5524 replace all uses of OP in debug insns with that
5525 temporary. */
5526 gimple *debugstmt;
5527 tree value = gimple_assign_rhs_to_tree (def);
5528 tree vexpr = make_node (DEBUG_EXPR_DECL);
5529 rtx val;
5530 machine_mode mode;
5532 set_curr_insn_location (gimple_location (def));
5534 DECL_ARTIFICIAL (vexpr) = 1;
5535 TREE_TYPE (vexpr) = TREE_TYPE (value);
5536 if (DECL_P (value))
5537 mode = DECL_MODE (value);
5538 else
5539 mode = TYPE_MODE (TREE_TYPE (value));
5540 DECL_MODE (vexpr) = mode;
5542 val = gen_rtx_VAR_LOCATION
5543 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5545 emit_debug_insn (val);
5547 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5549 if (!gimple_debug_bind_p (debugstmt))
5550 continue;
5552 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5553 SET_USE (use_p, vexpr);
5555 update_stmt (debugstmt);
5559 set_curr_insn_location (sloc);
5562 currently_expanding_gimple_stmt = stmt;
5564 /* Expand this statement, then evaluate the resulting RTL and
5565 fixup the CFG accordingly. */
5566 if (gimple_code (stmt) == GIMPLE_COND)
5568 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5569 if (new_bb)
5570 return new_bb;
5572 else if (gimple_debug_bind_p (stmt))
5574 location_t sloc = curr_insn_location ();
5575 gimple_stmt_iterator nsi = gsi;
5577 for (;;)
5579 tree var = gimple_debug_bind_get_var (stmt);
5580 tree value;
5581 rtx val;
5582 machine_mode mode;
5584 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5585 && TREE_CODE (var) != LABEL_DECL
5586 && !target_for_debug_bind (var))
5587 goto delink_debug_stmt;
5589 if (gimple_debug_bind_has_value_p (stmt))
5590 value = gimple_debug_bind_get_value (stmt);
5591 else
5592 value = NULL_TREE;
5594 last = get_last_insn ();
5596 set_curr_insn_location (gimple_location (stmt));
5598 if (DECL_P (var))
5599 mode = DECL_MODE (var);
5600 else
5601 mode = TYPE_MODE (TREE_TYPE (var));
5603 val = gen_rtx_VAR_LOCATION
5604 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5606 emit_debug_insn (val);
5608 if (dump_file && (dump_flags & TDF_DETAILS))
5610 /* We can't dump the insn with a TREE where an RTX
5611 is expected. */
5612 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5613 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5614 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5617 delink_debug_stmt:
5618 /* In order not to generate too many debug temporaries,
5619 we delink all uses of debug statements we already expanded.
5620 Therefore debug statements between definition and real
5621 use of TERed SSA names will continue to use the SSA name,
5622 and not be replaced with debug temps. */
5623 delink_stmt_imm_use (stmt);
5625 gsi = nsi;
5626 gsi_next (&nsi);
5627 if (gsi_end_p (nsi))
5628 break;
5629 stmt = gsi_stmt (nsi);
5630 if (!gimple_debug_bind_p (stmt))
5631 break;
5634 set_curr_insn_location (sloc);
5636 else if (gimple_debug_source_bind_p (stmt))
5638 location_t sloc = curr_insn_location ();
5639 tree var = gimple_debug_source_bind_get_var (stmt);
5640 tree value = gimple_debug_source_bind_get_value (stmt);
5641 rtx val;
5642 machine_mode mode;
5644 last = get_last_insn ();
5646 set_curr_insn_location (gimple_location (stmt));
5648 mode = DECL_MODE (var);
5650 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5651 VAR_INIT_STATUS_UNINITIALIZED);
5653 emit_debug_insn (val);
5655 if (dump_file && (dump_flags & TDF_DETAILS))
5657 /* We can't dump the insn with a TREE where an RTX
5658 is expected. */
5659 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5660 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5661 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5664 set_curr_insn_location (sloc);
5666 else
5668 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5669 if (call_stmt
5670 && gimple_call_tail_p (call_stmt)
5671 && disable_tail_calls)
5672 gimple_call_set_tail (call_stmt, false);
5674 if (call_stmt && gimple_call_tail_p (call_stmt))
5676 bool can_fallthru;
5677 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5678 if (new_bb)
5680 if (can_fallthru)
5681 bb = new_bb;
5682 else
5683 return new_bb;
5686 else
5688 def_operand_p def_p;
5689 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5691 if (def_p != NULL)
5693 /* Ignore this stmt if it is in the list of
5694 replaceable expressions. */
5695 if (SA.values
5696 && bitmap_bit_p (SA.values,
5697 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5698 continue;
5700 last = expand_gimple_stmt (stmt);
5701 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5706 currently_expanding_gimple_stmt = NULL;
5708 /* Expand implicit goto and convert goto_locus. */
5709 FOR_EACH_EDGE (e, ei, bb->succs)
5711 if (e->goto_locus != UNKNOWN_LOCATION)
5712 set_curr_insn_location (e->goto_locus);
5713 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5715 emit_jump (label_rtx_for_bb (e->dest));
5716 e->flags &= ~EDGE_FALLTHRU;
5720 /* Expanded RTL can create a jump in the last instruction of block.
5721 This later might be assumed to be a jump to successor and break edge insertion.
5722 We need to insert dummy move to prevent this. PR41440. */
5723 if (single_succ_p (bb)
5724 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5725 && (last = get_last_insn ())
5726 && JUMP_P (last))
5728 rtx dummy = gen_reg_rtx (SImode);
5729 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5732 do_pending_stack_adjust ();
5734 /* Find the block tail. The last insn in the block is the insn
5735 before a barrier and/or table jump insn. */
5736 last = get_last_insn ();
5737 if (BARRIER_P (last))
5738 last = PREV_INSN (last);
5739 if (JUMP_TABLE_DATA_P (last))
5740 last = PREV_INSN (PREV_INSN (last));
5741 BB_END (bb) = last;
5743 update_bb_for_insn (bb);
5745 return bb;
5749 /* Create a basic block for initialization code. */
5751 static basic_block
5752 construct_init_block (void)
5754 basic_block init_block, first_block;
5755 edge e = NULL;
5756 int flags;
5758 /* Multiple entry points not supported yet. */
5759 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5760 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5761 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5762 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5763 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5765 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5767 /* When entry edge points to first basic block, we don't need jump,
5768 otherwise we have to jump into proper target. */
5769 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5771 tree label = gimple_block_label (e->dest);
5773 emit_jump (jump_target_rtx (label));
5774 flags = 0;
5776 else
5777 flags = EDGE_FALLTHRU;
5779 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5780 get_last_insn (),
5781 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5782 init_block->frequency = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
5783 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5784 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5785 if (e)
5787 first_block = e->dest;
5788 redirect_edge_succ (e, init_block);
5789 e = make_edge (init_block, first_block, flags);
5791 else
5792 e = make_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_FALLTHRU);
5793 e->probability = REG_BR_PROB_BASE;
5794 e->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5796 update_bb_for_insn (init_block);
5797 return init_block;
5800 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5801 found in the block tree. */
5803 static void
5804 set_block_levels (tree block, int level)
5806 while (block)
5808 BLOCK_NUMBER (block) = level;
5809 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5810 block = BLOCK_CHAIN (block);
5814 /* Create a block containing landing pads and similar stuff. */
5816 static void
5817 construct_exit_block (void)
5819 rtx_insn *head = get_last_insn ();
5820 rtx_insn *end;
5821 basic_block exit_block;
5822 edge e, e2;
5823 unsigned ix;
5824 edge_iterator ei;
5825 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5826 rtx_insn *orig_end = BB_END (prev_bb);
5828 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5830 /* Make sure the locus is set to the end of the function, so that
5831 epilogue line numbers and warnings are set properly. */
5832 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5833 input_location = cfun->function_end_locus;
5835 /* Generate rtl for function exit. */
5836 expand_function_end ();
5838 end = get_last_insn ();
5839 if (head == end)
5840 return;
5841 /* While emitting the function end we could move end of the last basic
5842 block. */
5843 BB_END (prev_bb) = orig_end;
5844 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5845 head = NEXT_INSN (head);
5846 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5847 bb frequency counting will be confused. Any instructions before that
5848 label are emitted for the case where PREV_BB falls through into the
5849 exit block, so append those instructions to prev_bb in that case. */
5850 if (NEXT_INSN (head) != return_label)
5852 while (NEXT_INSN (head) != return_label)
5854 if (!NOTE_P (NEXT_INSN (head)))
5855 BB_END (prev_bb) = NEXT_INSN (head);
5856 head = NEXT_INSN (head);
5859 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5860 exit_block->frequency = EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency;
5861 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5862 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5864 ix = 0;
5865 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5867 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5868 if (!(e->flags & EDGE_ABNORMAL))
5869 redirect_edge_succ (e, exit_block);
5870 else
5871 ix++;
5874 e = make_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_FALLTHRU);
5875 e->probability = REG_BR_PROB_BASE;
5876 e->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5877 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5878 if (e2 != e)
5880 e->count -= e2->count;
5881 exit_block->count -= e2->count;
5882 exit_block->frequency -= EDGE_FREQUENCY (e2);
5884 if (e->count < 0)
5885 e->count = 0;
5886 if (exit_block->count < 0)
5887 exit_block->count = 0;
5888 if (exit_block->frequency < 0)
5889 exit_block->frequency = 0;
5890 update_bb_for_insn (exit_block);
5893 /* Helper function for discover_nonconstant_array_refs.
5894 Look for ARRAY_REF nodes with non-constant indexes and mark them
5895 addressable. */
5897 static tree
5898 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5899 void *data ATTRIBUTE_UNUSED)
5901 tree t = *tp;
5903 if (IS_TYPE_OR_DECL_P (t))
5904 *walk_subtrees = 0;
5905 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5907 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5908 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5909 && (!TREE_OPERAND (t, 2)
5910 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5911 || (TREE_CODE (t) == COMPONENT_REF
5912 && (!TREE_OPERAND (t,2)
5913 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5914 || TREE_CODE (t) == BIT_FIELD_REF
5915 || TREE_CODE (t) == REALPART_EXPR
5916 || TREE_CODE (t) == IMAGPART_EXPR
5917 || TREE_CODE (t) == VIEW_CONVERT_EXPR
5918 || CONVERT_EXPR_P (t))
5919 t = TREE_OPERAND (t, 0);
5921 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5923 t = get_base_address (t);
5924 if (t && DECL_P (t)
5925 && DECL_MODE (t) != BLKmode)
5926 TREE_ADDRESSABLE (t) = 1;
5929 *walk_subtrees = 0;
5932 return NULL_TREE;
5935 /* RTL expansion is not able to compile array references with variable
5936 offsets for arrays stored in single register. Discover such
5937 expressions and mark variables as addressable to avoid this
5938 scenario. */
5940 static void
5941 discover_nonconstant_array_refs (void)
5943 basic_block bb;
5944 gimple_stmt_iterator gsi;
5946 FOR_EACH_BB_FN (bb, cfun)
5947 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5949 gimple *stmt = gsi_stmt (gsi);
5950 if (!is_gimple_debug (stmt))
5951 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
5955 /* This function sets crtl->args.internal_arg_pointer to a virtual
5956 register if DRAP is needed. Local register allocator will replace
5957 virtual_incoming_args_rtx with the virtual register. */
5959 static void
5960 expand_stack_alignment (void)
5962 rtx drap_rtx;
5963 unsigned int preferred_stack_boundary;
5965 if (! SUPPORTS_STACK_ALIGNMENT)
5966 return;
5968 if (cfun->calls_alloca
5969 || cfun->has_nonlocal_label
5970 || crtl->has_nonlocal_goto)
5971 crtl->need_drap = true;
5973 /* Call update_stack_boundary here again to update incoming stack
5974 boundary. It may set incoming stack alignment to a different
5975 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
5976 use the minimum incoming stack alignment to check if it is OK
5977 to perform sibcall optimization since sibcall optimization will
5978 only align the outgoing stack to incoming stack boundary. */
5979 if (targetm.calls.update_stack_boundary)
5980 targetm.calls.update_stack_boundary ();
5982 /* The incoming stack frame has to be aligned at least at
5983 parm_stack_boundary. */
5984 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
5986 /* Update crtl->stack_alignment_estimated and use it later to align
5987 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
5988 exceptions since callgraph doesn't collect incoming stack alignment
5989 in this case. */
5990 if (cfun->can_throw_non_call_exceptions
5991 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
5992 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
5993 else
5994 preferred_stack_boundary = crtl->preferred_stack_boundary;
5995 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
5996 crtl->stack_alignment_estimated = preferred_stack_boundary;
5997 if (preferred_stack_boundary > crtl->stack_alignment_needed)
5998 crtl->stack_alignment_needed = preferred_stack_boundary;
6000 gcc_assert (crtl->stack_alignment_needed
6001 <= crtl->stack_alignment_estimated);
6003 crtl->stack_realign_needed
6004 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6005 crtl->stack_realign_tried = crtl->stack_realign_needed;
6007 crtl->stack_realign_processed = true;
6009 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6010 alignment. */
6011 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6012 drap_rtx = targetm.calls.get_drap_rtx ();
6014 /* stack_realign_drap and drap_rtx must match. */
6015 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6017 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6018 if (NULL != drap_rtx)
6020 crtl->args.internal_arg_pointer = drap_rtx;
6022 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6023 needed. */
6024 fixup_tail_calls ();
6029 static void
6030 expand_main_function (void)
6032 #if (defined(INVOKE__main) \
6033 || (!defined(HAS_INIT_SECTION) \
6034 && !defined(INIT_SECTION_ASM_OP) \
6035 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6036 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
6037 #endif
6041 /* Expand code to initialize the stack_protect_guard. This is invoked at
6042 the beginning of a function to be protected. */
6044 static void
6045 stack_protect_prologue (void)
6047 tree guard_decl = targetm.stack_protect_guard ();
6048 rtx x, y;
6050 x = expand_normal (crtl->stack_protect_guard);
6051 y = expand_normal (guard_decl);
6053 /* Allow the target to copy from Y to X without leaking Y into a
6054 register. */
6055 if (targetm.have_stack_protect_set ())
6056 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6058 emit_insn (insn);
6059 return;
6062 /* Otherwise do a straight move. */
6063 emit_move_insn (x, y);
6066 /* Translate the intermediate representation contained in the CFG
6067 from GIMPLE trees to RTL.
6069 We do conversion per basic block and preserve/update the tree CFG.
6070 This implies we have to do some magic as the CFG can simultaneously
6071 consist of basic blocks containing RTL and GIMPLE trees. This can
6072 confuse the CFG hooks, so be careful to not manipulate CFG during
6073 the expansion. */
6075 namespace {
6077 const pass_data pass_data_expand =
6079 RTL_PASS, /* type */
6080 "expand", /* name */
6081 OPTGROUP_NONE, /* optinfo_flags */
6082 TV_EXPAND, /* tv_id */
6083 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6084 | PROP_gimple_lcx
6085 | PROP_gimple_lvec
6086 | PROP_gimple_lva), /* properties_required */
6087 PROP_rtl, /* properties_provided */
6088 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6089 0, /* todo_flags_start */
6090 0, /* todo_flags_finish */
6093 class pass_expand : public rtl_opt_pass
6095 public:
6096 pass_expand (gcc::context *ctxt)
6097 : rtl_opt_pass (pass_data_expand, ctxt)
6100 /* opt_pass methods: */
6101 virtual unsigned int execute (function *);
6103 }; // class pass_expand
/* Entry point of the "expand" pass: lower the GIMPLE body of FUN to RTL.

   In order, this goes out of SSA form, expands the function's variables
   and parameter setup, expands every basic block between the init block
   and the exit block, builds the init and exit blocks, commits the insns
   queued on edges, rediscovers sub-basic-blocks, and finishes with stack
   alignment, EH generation and CFG cleanup.

   The statement order matters throughout, because most steps read or
   update global expansion state.  Always returns 0.  */
6105 unsigned int
6106 pass_expand::execute (function *fun)
6108 basic_block bb, init_block;
6109 sbitmap blocks;
6110 edge_iterator ei;
6111 edge e;
6112 rtx_insn *var_seq, *var_ret_seq;
6113 unsigned i;
/* Go out of SSA form and allocate the partition-to-pseudo table, one
   entry per partition of SA.map.  */
6115 timevar_push (TV_OUT_OF_SSA);
6116 rewrite_out_of_ssa (&SA);
6117 timevar_pop (TV_OUT_OF_SSA);
6118 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
/* NOTE(review): this loop walks CFUN while most of the function uses FUN;
   presumably they are the same function here -- confirm.  */
6120 if (MAY_HAVE_DEBUG_STMTS && flag_tree_ter)
6122 gimple_stmt_iterator gsi;
6123 FOR_EACH_BB_FN (bb, cfun)
6124 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6125 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6126 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6129 /* Make sure all values used by the optimization passes have sane
6130 defaults. */
6131 reg_renumber = 0;
6133 /* Some backends want to know that we are expanding to RTL. */
6134 currently_expanding_to_rtl = 1;
6135 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6136 free_dominance_info (CDI_DOMINATORS);
6138 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6140 if (chkp_function_instrumented_p (current_function_decl))
6141 chkp_reset_rtl_bounds ();
/* Choose the location for the insns emitted from here on; it is also
   recorded as prologue_location below.  */
6143 insn_locations_init ();
6144 if (!DECL_IS_BUILTIN (current_function_decl))
6146 /* Eventually, all FEs should explicitly set function_start_locus. */
6147 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6148 set_curr_insn_location
6149 (DECL_SOURCE_LOCATION (current_function_decl));
6150 else
6151 set_curr_insn_location (fun->function_start_locus);
6153 else
6154 set_curr_insn_location (UNKNOWN_LOCATION);
6155 prologue_location = curr_insn_location ();
6157 #ifdef INSN_SCHEDULING
6158 init_sched_attrs ();
6159 #endif
6161 /* Make sure first insn is a note even if we don't want linenums.
6162 This makes sure the first insn will never be deleted.
6163 Also, final expects a note to appear there. */
6164 emit_note (NOTE_INSN_DELETED);
6166 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6167 discover_nonconstant_array_refs ();
6169 targetm.expand_to_rtl_hook ();
6170 crtl->stack_alignment_needed = STACK_BOUNDARY;
6171 crtl->max_used_stack_slot_alignment = STACK_BOUNDARY;
6172 crtl->stack_alignment_estimated = 0;
6173 crtl->preferred_stack_boundary = STACK_BOUNDARY;
6174 fun->cfg->max_jumptable_ents = 0;
6176 /* Resolve the function section. Some targets, like ARM EABI rely on knowledge
6177 of the function section at expansion time to predict distance of calls. */
6178 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6180 /* Expand the variables recorded during gimple lowering. */
/* The insns are collected in a separate sequence (VAR_SEQ) so they can be
   placed relative to parm_birth_insn further down.  */
6181 timevar_push (TV_VAR_EXPAND);
6182 start_sequence ();
6184 var_ret_seq = expand_used_vars ();
6186 var_seq = get_insns ();
6187 end_sequence ();
6188 timevar_pop (TV_VAR_EXPAND);
6190 /* Honor stack protection warnings. */
6191 if (warn_stack_protect)
6193 if (fun->calls_alloca)
6194 warning (OPT_Wstack_protector,
6195 "stack protector not protecting local variables: "
6196 "variable length buffer");
6197 if (has_short_buffer && !crtl->stack_protect_guard)
6198 warning (OPT_Wstack_protector,
6199 "stack protector not protecting function: "
6200 "all local arrays are less than %d bytes long",
6201 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6204 /* Set up parameters and prepare for return, for the function. */
6205 expand_function_start (current_function_decl);
6207 /* If we emitted any instructions for setting up the variables,
6208 emit them before the FUNCTION_START note. */
6209 if (var_seq)
6211 emit_insn_before (var_seq, parm_birth_insn);
6213 /* In expand_function_end we'll insert the alloca save/restore
6214 before parm_birth_insn. We've just inserted an alloca call.
6215 Adjust the pointer to match. */
6216 parm_birth_insn = var_seq;
6219 /* If we have a class containing differently aligned pointers
6220 we need to merge those into the corresponding RTL pointer
6221 alignment. */
6222 for (i = 1; i < num_ssa_names; i++)
6224 tree name = ssa_name (i);
6225 int part;
6227 if (!name
6228 /* We might have generated new SSA names in
6229 update_alias_info_with_stack_vars. They will have a NULL
6230 defining statements, and won't be part of the partitioning,
6231 so ignore those. */
6232 || !SSA_NAME_DEF_STMT (name))
6233 continue;
6234 part = var_to_partition (SA.map, name);
6235 if (part == NO_PARTITION)
6236 continue;
6238 gcc_assert (SA.partition_to_pseudo[part]
6239 || defer_stack_allocation (name, true));
6241 /* If this decl was marked as living in multiple places, reset
6242 this now to NULL. */
6243 tree var = SSA_NAME_VAR (name);
6244 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6245 SET_DECL_RTL (var, NULL);
6246 /* Check that the pseudos chosen by assign_parms are those of
6247 the corresponding default defs. */
6248 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6249 && (TREE_CODE (var) == PARM_DECL
6250 || TREE_CODE (var) == RESULT_DECL))
6252 rtx in = DECL_RTL_IF_SET (var);
6253 gcc_assert (in);
6254 rtx out = SA.partition_to_pseudo[part];
6255 gcc_assert (in == out || rtx_equal_p (in, out));
6259 /* If this function is `main', emit a call to `__main'
6260 to run global initializers, etc. */
6261 if (DECL_NAME (current_function_decl)
6262 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6263 && DECL_FILE_SCOPE_P (current_function_decl))
6264 expand_main_function ();
6266 /* Initialize the stack_protect_guard field. This must happen after the
6267 call to __main (if any) so that the external decl is initialized. */
6268 if (crtl->stack_protect_guard)
6269 stack_protect_prologue ();
6271 expand_phi_nodes (&SA);
6273 /* Register rtl specific functions for cfg. */
6274 rtl_register_cfg_hooks ();
6276 init_block = construct_init_block ();
6278 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6279 remaining edges later. */
6280 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6281 e->flags &= ~EDGE_EXECUTABLE;
/* Expand each block after the init block.  The loop variable is
   reassigned from the return value of expand_gimple_basic_block, so the
   walk continues after whichever block that call returned.  */
6283 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6284 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6285 next_bb)
6286 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6288 if (MAY_HAVE_DEBUG_INSNS)
6289 expand_debug_locations ();
6291 if (deep_ter_debug_map)
6293 delete deep_ter_debug_map;
6294 deep_ter_debug_map = NULL;
6297 /* Free stuff we no longer need after GIMPLE optimizations. */
6298 free_dominance_info (CDI_DOMINATORS);
6299 free_dominance_info (CDI_POST_DOMINATORS);
6300 delete_tree_cfg_annotations ();
6302 timevar_push (TV_OUT_OF_SSA);
6303 finish_out_of_ssa (&SA);
6304 timevar_pop (TV_OUT_OF_SSA);
6306 timevar_push (TV_POST_EXPAND);
6307 /* We are no longer in SSA form. */
6308 fun->gimple_df->in_ssa_p = false;
6309 loops_state_clear (LOOP_CLOSED_SSA);
6311 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6312 conservatively to true until they are all profile aware. */
/* NOTE(review): the two statements below free the per-block label map and
   the histograms; the comment above does not describe them and looks
   stale.  */
6313 delete lab_rtx_for_bb;
6314 free_histograms ();
6316 construct_exit_block ();
6317 insn_locations_finalize ();
/* Emit the sequence returned by expand_used_vars after RETURN_LABEL, or
   after the basic block note that directly follows it.  */
6319 if (var_ret_seq)
6321 rtx_insn *after = return_label;
6322 rtx_insn *next = NEXT_INSN (after);
6323 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6324 after = next;
6325 emit_insn_after (var_ret_seq, after);
6328 /* Zap the tree EH table. */
6329 set_eh_throw_stmt_table (fun, NULL);
6331 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6332 split edges which edge insertions might do. */
6333 rebuild_jump_labels (get_insns ());
/* Commit the insns queued on edges.  The iterator only advances for edges
   without queued insns; after an insertion the same position is examined
   again.  */
6335 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6336 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6338 edge e;
6339 edge_iterator ei;
6340 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6342 if (e->insns.r)
6344 rebuild_jump_labels_chain (e->insns.r);
6345 /* Put insns after parm birth, but before
6346 NOTE_INSN_FUNCTION_BEG. */
6347 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6348 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6350 rtx_insn *insns = e->insns.r;
6351 e->insns.r = NULL;
6352 if (NOTE_P (parm_birth_insn)
6353 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6354 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6355 else
6356 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6358 else
6359 commit_one_edge_insertion (e);
6361 else
6362 ei_next (&ei);
6366 /* We're done expanding trees to RTL. */
6367 currently_expanding_to_rtl = 0;
6369 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6370 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6372 edge e;
6373 edge_iterator ei;
6374 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6376 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6377 e->flags &= ~EDGE_EXECUTABLE;
6379 /* At the moment not all abnormal edges match the RTL
6380 representation. It is safe to remove them here as
6381 find_many_sub_basic_blocks will rediscover them.
6382 In the future we should get this fixed properly. */
6383 if ((e->flags & EDGE_ABNORMAL)
6384 && !(e->flags & EDGE_SIBCALL))
6385 remove_edge (e);
6386 else
6387 ei_next (&ei);
/* Hand every block (all bits set) to find_many_sub_basic_blocks.  */
6391 blocks = sbitmap_alloc (last_basic_block_for_fn (fun));
6392 bitmap_ones (blocks);
6393 find_many_sub_basic_blocks (blocks);
6394 sbitmap_free (blocks);
6395 purge_all_dead_edges ();
6397 expand_stack_alignment ();
6399 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6400 function. */
6401 if (crtl->tail_call_emit)
6402 fixup_tail_calls ();
6404 /* After initial rtl generation, call back to finish generating
6405 exception support code. We need to do this before cleaning up
6406 the CFG as the code does not expect dead landing pads. */
6407 if (fun->eh->region_tree != NULL)
6408 finish_eh_generation ();
6410 /* Remove unreachable blocks, otherwise we cannot compute dominators
6411 which are needed for loop state verification. As a side-effect
6412 this also compacts blocks.
6413 ??? We cannot remove trivially dead insns here as for example
6414 the DRAP reg on i?86 is not magically live at this point.
6415 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6416 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6418 #ifdef ENABLE_CHECKING
6419 verify_flow_info ();
6420 #endif
6422 /* Initialize pseudos allocated for hard registers. */
6423 emit_initial_value_sets ();
6425 /* And finally unshare all RTL. */
6426 unshare_all_rtl ();
6428 /* There's no need to defer outputting this function any more; we
6429 know we want to output it. */
6430 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6432 /* Now that we're done expanding trees to RTL, we shouldn't have any
6433 more CONCATs anywhere. */
6434 generating_concat_p = 0;
6436 if (dump_file)
6438 fprintf (dump_file,
6439 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6440 /* And the pass manager will dump RTL for us. */
6443 /* If we're emitting a nested function, make sure its parent gets
6444 emitted as well. Doing otherwise confuses debug info. */
6446 tree parent;
6447 for (parent = DECL_CONTEXT (current_function_decl);
6448 parent != NULL_TREE;
6449 parent = get_containing_scope (parent))
6450 if (TREE_CODE (parent) == FUNCTION_DECL)
6451 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6454 /* We are now committed to emitting code for this function. Do any
6455 preparation, such as emitting abstract debug info for the inline
6456 before it gets mangled by optimization. */
6457 if (cgraph_function_possibly_inlined_p (current_function_decl))
6458 (*debug_hooks->outlining_inline_function) (current_function_decl);
6460 TREE_ASM_WRITTEN (current_function_decl) = 1;
6462 /* After expanding, the return labels are no longer needed. */
6463 return_label = NULL;
6464 naked_return_label = NULL;
6466 /* After expanding, the tm_restart map is no longer needed. */
/* NOTE(review): the guard is redundant; storing NULL unconditionally would
   leave the field in the same state.  */
6467 if (fun->gimple_df->tm_restart)
6468 fun->gimple_df->tm_restart = NULL;
6470 /* Tag the blocks with a depth number so that change_scope can find
6471 the common parent easily. */
6472 set_block_levels (DECL_INITIAL (fun->decl), 0);
6473 default_rtl_profile ();
6475 timevar_pop (TV_POST_EXPAND);
6477 return 0;
6480 } // anon namespace
6482 rtl_opt_pass *
6483 make_pass_expand (gcc::context *ctxt)
6485 return new pass_expand (ctxt);