[PR67891] don't test is_gimple_reg after parm expansion
[official-gcc.git] / gcc / cfgexpand.c
blobeaad859f513b6402566d9b41a73c140a7b45bcfa
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2015 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "cfghooks.h"
25 #include "tree.h"
26 #include "gimple.h"
27 #include "rtl.h"
28 #include "ssa.h"
29 #include "alias.h"
30 #include "fold-const.h"
31 #include "varasm.h"
32 #include "stor-layout.h"
33 #include "stmt.h"
34 #include "print-tree.h"
35 #include "tm_p.h"
36 #include "cfgrtl.h"
37 #include "cfganal.h"
38 #include "cfgbuild.h"
39 #include "cfgcleanup.h"
40 #include "insn-codes.h"
41 #include "optabs.h"
42 #include "flags.h"
43 #include "insn-config.h"
44 #include "expmed.h"
45 #include "dojump.h"
46 #include "explow.h"
47 #include "calls.h"
48 #include "emit-rtl.h"
49 #include "expr.h"
50 #include "langhooks.h"
51 #include "internal-fn.h"
52 #include "tree-eh.h"
53 #include "gimple-iterator.h"
54 #include "gimple-walk.h"
55 #include "cgraph.h"
56 #include "tree-cfg.h"
57 #include "tree-dfa.h"
58 #include "tree-ssa.h"
59 #include "tree-pass.h"
60 #include "except.h"
61 #include "diagnostic.h"
62 #include "gimple-pretty-print.h"
63 #include "toplev.h"
64 #include "debug.h"
65 #include "params.h"
66 #include "tree-inline.h"
67 #include "value-prof.h"
68 #include "target.h"
69 #include "tree-ssa-live.h"
70 #include "tree-outof-ssa.h"
71 #include "cfgloop.h"
72 #include "regs.h" /* For reg_renumber. */
73 #include "insn-attr.h" /* For INSN_SCHEDULING. */
74 #include "asan.h"
75 #include "tree-ssa-address.h"
76 #include "recog.h"
77 #include "output.h"
78 #include "builtins.h"
79 #include "tree-chkp.h"
80 #include "rtl-chkp.h"
82 /* Some systems use __main in a way incompatible with its use in gcc, in these
83 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
84 give the same symbol without quotes for an alternative entry point. You
85 must define both, or neither. */
86 #ifndef NAME__MAIN
87 #define NAME__MAIN "__main"
88 #endif
90 /* This variable holds information helping the rewriting of SSA trees
91 into RTL. */
92 struct ssaexpand SA;
94 /* This variable holds the currently expanded gimple statement for purposes
95 of comminucating the profile info to the builtin expanders. */
96 gimple *currently_expanding_gimple_stmt;
98 static rtx expand_debug_expr (tree);
100 static bool defer_stack_allocation (tree, bool);
102 static void record_alignment_for_reg_var (unsigned int);
104 /* Return an expression tree corresponding to the RHS of GIMPLE
105 statement STMT. */
107 tree
108 gimple_assign_rhs_to_tree (gimple *stmt)
110 tree t;
111 enum gimple_rhs_class grhs_class;
113 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
115 if (grhs_class == GIMPLE_TERNARY_RHS)
116 t = build3 (gimple_assign_rhs_code (stmt),
117 TREE_TYPE (gimple_assign_lhs (stmt)),
118 gimple_assign_rhs1 (stmt),
119 gimple_assign_rhs2 (stmt),
120 gimple_assign_rhs3 (stmt));
121 else if (grhs_class == GIMPLE_BINARY_RHS)
122 t = build2 (gimple_assign_rhs_code (stmt),
123 TREE_TYPE (gimple_assign_lhs (stmt)),
124 gimple_assign_rhs1 (stmt),
125 gimple_assign_rhs2 (stmt));
126 else if (grhs_class == GIMPLE_UNARY_RHS)
127 t = build1 (gimple_assign_rhs_code (stmt),
128 TREE_TYPE (gimple_assign_lhs (stmt)),
129 gimple_assign_rhs1 (stmt));
130 else if (grhs_class == GIMPLE_SINGLE_RHS)
132 t = gimple_assign_rhs1 (stmt);
133 /* Avoid modifying this tree in place below. */
134 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
135 && gimple_location (stmt) != EXPR_LOCATION (t))
136 || (gimple_block (stmt)
137 && currently_expanding_to_rtl
138 && EXPR_P (t)))
139 t = copy_node (t);
141 else
142 gcc_unreachable ();
144 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
145 SET_EXPR_LOCATION (t, gimple_location (stmt));
147 return t;
#ifndef STACK_ALIGNMENT_NEEDED
#define STACK_ALIGNMENT_NEEDED 1
#endif

/* Map an SSA_NAME X to its underlying variable (which may be null, callers
   in this file test for that); any other tree maps to itself.  Note that
   X is evaluated more than once.  */
#define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : (x))
157 /* Choose either CUR or NEXT as the leader DECL for a partition.
158 Prefer ignored decls, to simplify debug dumps and reduce ambiguity
159 out of the same user variable being in multiple partitions (this is
160 less likely for compiler-introduced temps). */
162 static tree
163 leader_merge (tree cur, tree next)
165 if (cur == NULL || cur == next)
166 return next;
168 if (DECL_P (cur) && DECL_IGNORED_P (cur))
169 return cur;
171 if (DECL_P (next) && DECL_IGNORED_P (next))
172 return next;
174 return cur;
177 /* Associate declaration T with storage space X. If T is no
178 SSA name this is exactly SET_DECL_RTL, otherwise make the
179 partition of T associated with X. */
180 static inline void
181 set_rtl (tree t, rtx x)
183 gcc_checking_assert (!x
184 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
185 || (use_register_for_decl (t)
186 ? (REG_P (x)
187 || (GET_CODE (x) == CONCAT
188 && (REG_P (XEXP (x, 0))
189 || SUBREG_P (XEXP (x, 0)))
190 && (REG_P (XEXP (x, 1))
191 || SUBREG_P (XEXP (x, 1))))
192 || (GET_CODE (x) == PARALLEL
193 && SSAVAR (t)
194 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
195 && !flag_tree_coalesce_vars))
196 : (MEM_P (x) || x == pc_rtx
197 || (GET_CODE (x) == CONCAT
198 && MEM_P (XEXP (x, 0))
199 && MEM_P (XEXP (x, 1))))));
200 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
201 RESULT_DECLs has the expected mode. For memory, we accept
202 unpromoted modes, since that's what we're likely to get. For
203 PARM_DECLs and RESULT_DECLs, we'll have been called by
204 set_parm_rtl, which will give us the default def, so we don't
205 have to compute it ourselves. For RESULT_DECLs, we accept mode
206 mismatches too, as long as we're not coalescing across variables,
207 so that we don't reject BLKmode PARALLELs or unpromoted REGs. */
208 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
209 || (SSAVAR (t) && TREE_CODE (SSAVAR (t)) == RESULT_DECL
210 && !flag_tree_coalesce_vars)
211 || !use_register_for_decl (t)
212 || GET_MODE (x) == promote_ssa_mode (t, NULL));
214 if (x)
216 bool skip = false;
217 tree cur = NULL_TREE;
218 rtx xm = x;
220 retry:
221 if (MEM_P (xm))
222 cur = MEM_EXPR (xm);
223 else if (REG_P (xm))
224 cur = REG_EXPR (xm);
225 else if (SUBREG_P (xm))
227 gcc_assert (subreg_lowpart_p (xm));
228 xm = SUBREG_REG (xm);
229 goto retry;
231 else if (GET_CODE (xm) == CONCAT)
233 xm = XEXP (xm, 0);
234 goto retry;
236 else if (GET_CODE (xm) == PARALLEL)
238 xm = XVECEXP (xm, 0, 0);
239 gcc_assert (GET_CODE (xm) == EXPR_LIST);
240 xm = XEXP (xm, 0);
241 goto retry;
243 else if (xm == pc_rtx)
244 skip = true;
245 else
246 gcc_unreachable ();
248 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
250 if (cur != next)
252 if (MEM_P (x))
253 set_mem_attributes (x,
254 next && TREE_CODE (next) == SSA_NAME
255 ? TREE_TYPE (next)
256 : next, true);
257 else
258 set_reg_attrs_for_decl_rtl (next, x);
262 if (TREE_CODE (t) == SSA_NAME)
264 int part = var_to_partition (SA.map, t);
265 if (part != NO_PARTITION)
267 if (SA.partition_to_pseudo[part])
268 gcc_assert (SA.partition_to_pseudo[part] == x);
269 else if (x != pc_rtx)
270 SA.partition_to_pseudo[part] = x;
272 /* For the benefit of debug information at -O0 (where
273 vartracking doesn't run) record the place also in the base
274 DECL. For PARMs and RESULTs, do so only when setting the
275 default def. */
276 if (x && x != pc_rtx && SSA_NAME_VAR (t)
277 && (VAR_P (SSA_NAME_VAR (t))
278 || SSA_NAME_IS_DEFAULT_DEF (t)))
280 tree var = SSA_NAME_VAR (t);
281 /* If we don't yet have something recorded, just record it now. */
282 if (!DECL_RTL_SET_P (var))
283 SET_DECL_RTL (var, x);
284 /* If we have it set already to "multiple places" don't
285 change this. */
286 else if (DECL_RTL (var) == pc_rtx)
288 /* If we have something recorded and it's not the same place
289 as we want to record now, we have multiple partitions for the
290 same base variable, with different places. We can't just
291 randomly chose one, hence we have to say that we don't know.
292 This only happens with optimization, and there var-tracking
293 will figure out the right thing. */
294 else if (DECL_RTL (var) != x)
295 SET_DECL_RTL (var, pc_rtx);
298 else
299 SET_DECL_RTL (t, x);
302 /* This structure holds data relevant to one variable that will be
303 placed in a stack slot. */
304 struct stack_var
306 /* The Variable. */
307 tree decl;
309 /* Initially, the size of the variable. Later, the size of the partition,
310 if this variable becomes it's partition's representative. */
311 HOST_WIDE_INT size;
313 /* The *byte* alignment required for this variable. Or as, with the
314 size, the alignment for this partition. */
315 unsigned int alignb;
317 /* The partition representative. */
318 size_t representative;
320 /* The next stack variable in the partition, or EOC. */
321 size_t next;
323 /* The numbers of conflicting stack variables. */
324 bitmap conflicts;
327 #define EOC ((size_t)-1)
329 /* We have an array of such objects while deciding allocation. */
330 static struct stack_var *stack_vars;
331 static size_t stack_vars_alloc;
332 static size_t stack_vars_num;
333 static hash_map<tree, size_t> *decl_to_stack_part;
335 /* Conflict bitmaps go on this obstack. This allows us to destroy
336 all of them in one big sweep. */
337 static bitmap_obstack stack_var_bitmap_obstack;
339 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
340 is non-decreasing. */
341 static size_t *stack_vars_sorted;
343 /* The phase of the stack frame. This is the known misalignment of
344 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
345 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
346 static int frame_phase;
348 /* Used during expand_used_vars to remember if we saw any decls for
349 which we'd like to enable stack smashing protection. */
350 static bool has_protected_decls;
352 /* Used during expand_used_vars. Remember if we say a character buffer
353 smaller than our cutoff threshold. Used for -Wstack-protector. */
354 static bool has_short_buffer;
356 /* Compute the byte alignment to use for DECL. Ignore alignment
357 we can't do with expected alignment of the stack boundary. */
359 static unsigned int
360 align_local_variable (tree decl)
362 unsigned int align;
364 if (TREE_CODE (decl) == SSA_NAME)
365 align = TYPE_ALIGN (TREE_TYPE (decl));
366 else
368 align = LOCAL_DECL_ALIGNMENT (decl);
369 DECL_ALIGN (decl) = align;
371 return align / BITS_PER_UNIT;
374 /* Align given offset BASE with ALIGN. Truncate up if ALIGN_UP is true,
375 down otherwise. Return truncated BASE value. */
377 static inline unsigned HOST_WIDE_INT
378 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
380 return align_up ? (base + align - 1) & -align : base & -align;
383 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
384 Return the frame offset. */
386 static HOST_WIDE_INT
387 alloc_stack_frame_space (HOST_WIDE_INT size, unsigned HOST_WIDE_INT align)
389 HOST_WIDE_INT offset, new_frame_offset;
391 if (FRAME_GROWS_DOWNWARD)
393 new_frame_offset
394 = align_base (frame_offset - frame_phase - size,
395 align, false) + frame_phase;
396 offset = new_frame_offset;
398 else
400 new_frame_offset
401 = align_base (frame_offset - frame_phase, align, true) + frame_phase;
402 offset = new_frame_offset;
403 new_frame_offset += size;
405 frame_offset = new_frame_offset;
407 if (frame_offset_overflow (frame_offset, cfun->decl))
408 frame_offset = offset = 0;
410 return offset;
413 /* Accumulate DECL into STACK_VARS. */
415 static void
416 add_stack_var (tree decl)
418 struct stack_var *v;
420 if (stack_vars_num >= stack_vars_alloc)
422 if (stack_vars_alloc)
423 stack_vars_alloc = stack_vars_alloc * 3 / 2;
424 else
425 stack_vars_alloc = 32;
426 stack_vars
427 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
429 if (!decl_to_stack_part)
430 decl_to_stack_part = new hash_map<tree, size_t>;
432 v = &stack_vars[stack_vars_num];
433 decl_to_stack_part->put (decl, stack_vars_num);
435 v->decl = decl;
436 tree size = TREE_CODE (decl) == SSA_NAME
437 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
438 : DECL_SIZE_UNIT (decl);
439 v->size = tree_to_uhwi (size);
440 /* Ensure that all variables have size, so that &a != &b for any two
441 variables that are simultaneously live. */
442 if (v->size == 0)
443 v->size = 1;
444 v->alignb = align_local_variable (decl);
445 /* An alignment of zero can mightily confuse us later. */
446 gcc_assert (v->alignb != 0);
448 /* All variables are initially in their own partition. */
449 v->representative = stack_vars_num;
450 v->next = EOC;
452 /* All variables initially conflict with no other. */
453 v->conflicts = NULL;
455 /* Ensure that this decl doesn't get put onto the list twice. */
456 set_rtl (decl, pc_rtx);
458 stack_vars_num++;
461 /* Make the decls associated with luid's X and Y conflict. */
463 static void
464 add_stack_var_conflict (size_t x, size_t y)
466 struct stack_var *a = &stack_vars[x];
467 struct stack_var *b = &stack_vars[y];
468 if (!a->conflicts)
469 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
470 if (!b->conflicts)
471 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
472 bitmap_set_bit (a->conflicts, y);
473 bitmap_set_bit (b->conflicts, x);
476 /* Check whether the decls associated with luid's X and Y conflict. */
478 static bool
479 stack_var_conflict_p (size_t x, size_t y)
481 struct stack_var *a = &stack_vars[x];
482 struct stack_var *b = &stack_vars[y];
483 if (x == y)
484 return false;
485 /* Partitions containing an SSA name result from gimple registers
486 with things like unsupported modes. They are top-level and
487 hence conflict with everything else. */
488 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
489 return true;
491 if (!a->conflicts || !b->conflicts)
492 return false;
493 return bitmap_bit_p (a->conflicts, y);
496 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
497 enter its partition number into bitmap DATA. */
499 static bool
500 visit_op (gimple *, tree op, tree, void *data)
502 bitmap active = (bitmap)data;
503 op = get_base_address (op);
504 if (op
505 && DECL_P (op)
506 && DECL_RTL_IF_SET (op) == pc_rtx)
508 size_t *v = decl_to_stack_part->get (op);
509 if (v)
510 bitmap_set_bit (active, *v);
512 return false;
515 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
516 record conflicts between it and all currently active other partitions
517 from bitmap DATA. */
519 static bool
520 visit_conflict (gimple *, tree op, tree, void *data)
522 bitmap active = (bitmap)data;
523 op = get_base_address (op);
524 if (op
525 && DECL_P (op)
526 && DECL_RTL_IF_SET (op) == pc_rtx)
528 size_t *v = decl_to_stack_part->get (op);
529 if (v && bitmap_set_bit (active, *v))
531 size_t num = *v;
532 bitmap_iterator bi;
533 unsigned i;
534 gcc_assert (num < stack_vars_num);
535 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
536 add_stack_var_conflict (num, i);
539 return false;
542 /* Helper routine for add_scope_conflicts, calculating the active partitions
543 at the end of BB, leaving the result in WORK. We're called to generate
544 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
545 liveness. */
547 static void
548 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
550 edge e;
551 edge_iterator ei;
552 gimple_stmt_iterator gsi;
553 walk_stmt_load_store_addr_fn visit;
555 bitmap_clear (work);
556 FOR_EACH_EDGE (e, ei, bb->preds)
557 bitmap_ior_into (work, (bitmap)e->src->aux);
559 visit = visit_op;
561 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
563 gimple *stmt = gsi_stmt (gsi);
564 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
566 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
568 gimple *stmt = gsi_stmt (gsi);
570 if (gimple_clobber_p (stmt))
572 tree lhs = gimple_assign_lhs (stmt);
573 size_t *v;
574 /* Nested function lowering might introduce LHSs
575 that are COMPONENT_REFs. */
576 if (TREE_CODE (lhs) != VAR_DECL)
577 continue;
578 if (DECL_RTL_IF_SET (lhs) == pc_rtx
579 && (v = decl_to_stack_part->get (lhs)))
580 bitmap_clear_bit (work, *v);
582 else if (!is_gimple_debug (stmt))
584 if (for_conflict
585 && visit == visit_op)
587 /* If this is the first real instruction in this BB we need
588 to add conflicts for everything live at this point now.
589 Unlike classical liveness for named objects we can't
590 rely on seeing a def/use of the names we're interested in.
591 There might merely be indirect loads/stores. We'd not add any
592 conflicts for such partitions. */
593 bitmap_iterator bi;
594 unsigned i;
595 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
597 struct stack_var *a = &stack_vars[i];
598 if (!a->conflicts)
599 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
600 bitmap_ior_into (a->conflicts, work);
602 visit = visit_conflict;
604 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
609 /* Generate stack partition conflicts between all partitions that are
610 simultaneously live. */
612 static void
613 add_scope_conflicts (void)
615 basic_block bb;
616 bool changed;
617 bitmap work = BITMAP_ALLOC (NULL);
618 int *rpo;
619 int n_bbs;
621 /* We approximate the live range of a stack variable by taking the first
622 mention of its name as starting point(s), and by the end-of-scope
623 death clobber added by gimplify as ending point(s) of the range.
624 This overapproximates in the case we for instance moved an address-taken
625 operation upward, without also moving a dereference to it upwards.
626 But it's conservatively correct as a variable never can hold values
627 before its name is mentioned at least once.
629 We then do a mostly classical bitmap liveness algorithm. */
631 FOR_ALL_BB_FN (bb, cfun)
632 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
634 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
635 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
637 changed = true;
638 while (changed)
640 int i;
641 changed = false;
642 for (i = 0; i < n_bbs; i++)
644 bitmap active;
645 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
646 active = (bitmap)bb->aux;
647 add_scope_conflicts_1 (bb, work, false);
648 if (bitmap_ior_into (active, work))
649 changed = true;
653 FOR_EACH_BB_FN (bb, cfun)
654 add_scope_conflicts_1 (bb, work, true);
656 free (rpo);
657 BITMAP_FREE (work);
658 FOR_ALL_BB_FN (bb, cfun)
659 BITMAP_FREE (bb->aux);
662 /* A subroutine of partition_stack_vars. A comparison function for qsort,
663 sorting an array of indices by the properties of the object. */
665 static int
666 stack_var_cmp (const void *a, const void *b)
668 size_t ia = *(const size_t *)a;
669 size_t ib = *(const size_t *)b;
670 unsigned int aligna = stack_vars[ia].alignb;
671 unsigned int alignb = stack_vars[ib].alignb;
672 HOST_WIDE_INT sizea = stack_vars[ia].size;
673 HOST_WIDE_INT sizeb = stack_vars[ib].size;
674 tree decla = stack_vars[ia].decl;
675 tree declb = stack_vars[ib].decl;
676 bool largea, largeb;
677 unsigned int uida, uidb;
679 /* Primary compare on "large" alignment. Large comes first. */
680 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
681 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
682 if (largea != largeb)
683 return (int)largeb - (int)largea;
685 /* Secondary compare on size, decreasing */
686 if (sizea > sizeb)
687 return -1;
688 if (sizea < sizeb)
689 return 1;
691 /* Tertiary compare on true alignment, decreasing. */
692 if (aligna < alignb)
693 return -1;
694 if (aligna > alignb)
695 return 1;
697 /* Final compare on ID for sort stability, increasing.
698 Two SSA names are compared by their version, SSA names come before
699 non-SSA names, and two normal decls are compared by their DECL_UID. */
700 if (TREE_CODE (decla) == SSA_NAME)
702 if (TREE_CODE (declb) == SSA_NAME)
703 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
704 else
705 return -1;
707 else if (TREE_CODE (declb) == SSA_NAME)
708 return 1;
709 else
710 uida = DECL_UID (decla), uidb = DECL_UID (declb);
711 if (uida < uidb)
712 return 1;
713 if (uida > uidb)
714 return -1;
715 return 0;
718 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
719 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
721 /* If the points-to solution *PI points to variables that are in a partition
722 together with other variables add all partition members to the pointed-to
723 variables bitmap. */
725 static void
726 add_partitioned_vars_to_ptset (struct pt_solution *pt,
727 part_hashmap *decls_to_partitions,
728 hash_set<bitmap> *visited, bitmap temp)
730 bitmap_iterator bi;
731 unsigned i;
732 bitmap *part;
734 if (pt->anything
735 || pt->vars == NULL
736 /* The pointed-to vars bitmap is shared, it is enough to
737 visit it once. */
738 || visited->add (pt->vars))
739 return;
741 bitmap_clear (temp);
743 /* By using a temporary bitmap to store all members of the partitions
744 we have to add we make sure to visit each of the partitions only
745 once. */
746 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
747 if ((!temp
748 || !bitmap_bit_p (temp, i))
749 && (part = decls_to_partitions->get (i)))
750 bitmap_ior_into (temp, *part);
751 if (!bitmap_empty_p (temp))
752 bitmap_ior_into (pt->vars, temp);
755 /* Update points-to sets based on partition info, so we can use them on RTL.
756 The bitmaps representing stack partitions will be saved until expand,
757 where partitioned decls used as bases in memory expressions will be
758 rewritten. */
760 static void
761 update_alias_info_with_stack_vars (void)
763 part_hashmap *decls_to_partitions = NULL;
764 size_t i, j;
765 tree var = NULL_TREE;
767 for (i = 0; i < stack_vars_num; i++)
769 bitmap part = NULL;
770 tree name;
771 struct ptr_info_def *pi;
773 /* Not interested in partitions with single variable. */
774 if (stack_vars[i].representative != i
775 || stack_vars[i].next == EOC)
776 continue;
778 if (!decls_to_partitions)
780 decls_to_partitions = new part_hashmap;
781 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
784 /* Create an SSA_NAME that points to the partition for use
785 as base during alias-oracle queries on RTL for bases that
786 have been partitioned. */
787 if (var == NULL_TREE)
788 var = create_tmp_var (ptr_type_node);
789 name = make_ssa_name (var);
791 /* Create bitmaps representing partitions. They will be used for
792 points-to sets later, so use GGC alloc. */
793 part = BITMAP_GGC_ALLOC ();
794 for (j = i; j != EOC; j = stack_vars[j].next)
796 tree decl = stack_vars[j].decl;
797 unsigned int uid = DECL_PT_UID (decl);
798 bitmap_set_bit (part, uid);
799 decls_to_partitions->put (uid, part);
800 cfun->gimple_df->decls_to_pointers->put (decl, name);
801 if (TREE_ADDRESSABLE (decl))
802 TREE_ADDRESSABLE (name) = 1;
805 /* Make the SSA name point to all partition members. */
806 pi = get_ptr_info (name);
807 pt_solution_set (&pi->pt, part, false);
810 /* Make all points-to sets that contain one member of a partition
811 contain all members of the partition. */
812 if (decls_to_partitions)
814 unsigned i;
815 hash_set<bitmap> visited;
816 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
818 for (i = 1; i < num_ssa_names; i++)
820 tree name = ssa_name (i);
821 struct ptr_info_def *pi;
823 if (name
824 && POINTER_TYPE_P (TREE_TYPE (name))
825 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
826 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
827 &visited, temp);
830 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
831 decls_to_partitions, &visited, temp);
833 delete decls_to_partitions;
834 BITMAP_FREE (temp);
838 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
839 partitioning algorithm. Partitions A and B are known to be non-conflicting.
840 Merge them into a single partition A. */
842 static void
843 union_stack_vars (size_t a, size_t b)
845 struct stack_var *vb = &stack_vars[b];
846 bitmap_iterator bi;
847 unsigned u;
849 gcc_assert (stack_vars[b].next == EOC);
850 /* Add B to A's partition. */
851 stack_vars[b].next = stack_vars[a].next;
852 stack_vars[b].representative = a;
853 stack_vars[a].next = b;
855 /* Update the required alignment of partition A to account for B. */
856 if (stack_vars[a].alignb < stack_vars[b].alignb)
857 stack_vars[a].alignb = stack_vars[b].alignb;
859 /* Update the interference graph and merge the conflicts. */
860 if (vb->conflicts)
862 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
863 add_stack_var_conflict (a, stack_vars[u].representative);
864 BITMAP_FREE (vb->conflicts);
868 /* A subroutine of expand_used_vars. Binpack the variables into
869 partitions constrained by the interference graph. The overall
870 algorithm used is as follows:
872 Sort the objects by size in descending order.
873 For each object A {
874 S = size(A)
875 O = 0
876 loop {
877 Look for the largest non-conflicting object B with size <= S.
878 UNION (A, B)
883 static void
884 partition_stack_vars (void)
886 size_t si, sj, n = stack_vars_num;
888 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
889 for (si = 0; si < n; ++si)
890 stack_vars_sorted[si] = si;
892 if (n == 1)
893 return;
895 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
897 for (si = 0; si < n; ++si)
899 size_t i = stack_vars_sorted[si];
900 unsigned int ialign = stack_vars[i].alignb;
901 HOST_WIDE_INT isize = stack_vars[i].size;
903 /* Ignore objects that aren't partition representatives. If we
904 see a var that is not a partition representative, it must
905 have been merged earlier. */
906 if (stack_vars[i].representative != i)
907 continue;
909 for (sj = si + 1; sj < n; ++sj)
911 size_t j = stack_vars_sorted[sj];
912 unsigned int jalign = stack_vars[j].alignb;
913 HOST_WIDE_INT jsize = stack_vars[j].size;
915 /* Ignore objects that aren't partition representatives. */
916 if (stack_vars[j].representative != j)
917 continue;
919 /* Do not mix objects of "small" (supported) alignment
920 and "large" (unsupported) alignment. */
921 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
922 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
923 break;
925 /* For Address Sanitizer do not mix objects with different
926 sizes, as the shorter vars wouldn't be adequately protected.
927 Don't do that for "large" (unsupported) alignment objects,
928 those aren't protected anyway. */
929 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK && isize != jsize
930 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
931 break;
933 /* Ignore conflicting objects. */
934 if (stack_var_conflict_p (i, j))
935 continue;
937 /* UNION the objects, placing J at OFFSET. */
938 union_stack_vars (i, j);
942 update_alias_info_with_stack_vars ();
945 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
947 static void
948 dump_stack_var_partition (void)
950 size_t si, i, j, n = stack_vars_num;
952 for (si = 0; si < n; ++si)
954 i = stack_vars_sorted[si];
956 /* Skip variables that aren't partition representatives, for now. */
957 if (stack_vars[i].representative != i)
958 continue;
960 fprintf (dump_file, "Partition %lu: size " HOST_WIDE_INT_PRINT_DEC
961 " align %u\n", (unsigned long) i, stack_vars[i].size,
962 stack_vars[i].alignb);
964 for (j = i; j != EOC; j = stack_vars[j].next)
966 fputc ('\t', dump_file);
967 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
969 fputc ('\n', dump_file);
973 /* Assign rtl to DECL at BASE + OFFSET. */
975 static void
976 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
977 HOST_WIDE_INT offset)
979 unsigned align;
980 rtx x;
982 /* If this fails, we've overflowed the stack frame. Error nicely? */
983 gcc_assert (offset == trunc_int_for_mode (offset, Pmode));
985 x = plus_constant (Pmode, base, offset);
986 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
987 ? TYPE_MODE (TREE_TYPE (decl))
988 : DECL_MODE (SSAVAR (decl)), x);
990 if (TREE_CODE (decl) != SSA_NAME)
992 /* Set alignment we actually gave this decl if it isn't an SSA name.
993 If it is we generate stack slots only accidentally so it isn't as
994 important, we'll simply use the alignment that is already set. */
995 if (base == virtual_stack_vars_rtx)
996 offset -= frame_phase;
997 align = offset & -offset;
998 align *= BITS_PER_UNIT;
999 if (align == 0 || align > base_align)
1000 align = base_align;
1002 /* One would think that we could assert that we're not decreasing
1003 alignment here, but (at least) the i386 port does exactly this
1004 via the MINIMUM_ALIGNMENT hook. */
1006 DECL_ALIGN (decl) = align;
1007 DECL_USER_ALIGN (decl) = 0;
1010 set_rtl (decl, x);
1013 struct stack_vars_data
1015 /* Vector of offset pairs, always end of some padding followed
1016 by start of the padding that needs Address Sanitizer protection.
1017 The vector is in reversed, highest offset pairs come first. */
1018 vec<HOST_WIDE_INT> asan_vec;
1020 /* Vector of partition representative decls in between the paddings. */
1021 vec<tree> asan_decl_vec;
1023 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1024 rtx asan_base;
1026 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1027 unsigned int asan_alignb;
1030 /* A subroutine of expand_used_vars. Give each partition representative
1031 a unique location within the stack frame. Update each partition member
1032 with that location. */
1034 static void
1035 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
1037 size_t si, i, j, n = stack_vars_num;
1038 HOST_WIDE_INT large_size = 0, large_alloc = 0;
1039 rtx large_base = NULL;
1040 unsigned large_align = 0;
1041 tree decl;
1043 /* Determine if there are any variables requiring "large" alignment.
1044 Since these are dynamically allocated, we only process these if
1045 no predicate involved. */
1046 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1047 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1049 /* Find the total size of these variables. */
1050 for (si = 0; si < n; ++si)
1052 unsigned alignb;
1054 i = stack_vars_sorted[si];
1055 alignb = stack_vars[i].alignb;
1057 /* All "large" alignment decls come before all "small" alignment
1058 decls, but "large" alignment decls are not sorted based on
1059 their alignment. Increase large_align to track the largest
1060 required alignment. */
1061 if ((alignb * BITS_PER_UNIT) > large_align)
1062 large_align = alignb * BITS_PER_UNIT;
1064 /* Stop when we get to the first decl with "small" alignment. */
1065 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1066 break;
1068 /* Skip variables that aren't partition representatives. */
1069 if (stack_vars[i].representative != i)
1070 continue;
1072 /* Skip variables that have already had rtl assigned. See also
1073 add_stack_var where we perpetrate this pc_rtx hack. */
1074 decl = stack_vars[i].decl;
1075 if (TREE_CODE (decl) == SSA_NAME
1076 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1077 : DECL_RTL (decl) != pc_rtx)
1078 continue;
1080 large_size += alignb - 1;
1081 large_size &= -(HOST_WIDE_INT)alignb;
1082 large_size += stack_vars[i].size;
1085 /* If there were any, allocate space. */
1086 if (large_size > 0)
1087 large_base = allocate_dynamic_stack_space (GEN_INT (large_size), 0,
1088 large_align, true);
1091 for (si = 0; si < n; ++si)
1093 rtx base;
1094 unsigned base_align, alignb;
1095 HOST_WIDE_INT offset;
1097 i = stack_vars_sorted[si];
1099 /* Skip variables that aren't partition representatives, for now. */
1100 if (stack_vars[i].representative != i)
1101 continue;
1103 /* Skip variables that have already had rtl assigned. See also
1104 add_stack_var where we perpetrate this pc_rtx hack. */
1105 decl = stack_vars[i].decl;
1106 if (TREE_CODE (decl) == SSA_NAME
1107 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1108 : DECL_RTL (decl) != pc_rtx)
1109 continue;
1111 /* Check the predicate to see whether this variable should be
1112 allocated in this pass. */
1113 if (pred && !pred (i))
1114 continue;
1116 alignb = stack_vars[i].alignb;
1117 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1119 base = virtual_stack_vars_rtx;
1120 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK && pred)
1122 HOST_WIDE_INT prev_offset
1123 = align_base (frame_offset,
1124 MAX (alignb, ASAN_RED_ZONE_SIZE),
1125 FRAME_GROWS_DOWNWARD);
1126 tree repr_decl = NULL_TREE;
1127 offset
1128 = alloc_stack_frame_space (stack_vars[i].size
1129 + ASAN_RED_ZONE_SIZE,
1130 MAX (alignb, ASAN_RED_ZONE_SIZE));
1132 data->asan_vec.safe_push (prev_offset);
1133 data->asan_vec.safe_push (offset + stack_vars[i].size);
1134 /* Find best representative of the partition.
1135 Prefer those with DECL_NAME, even better
1136 satisfying asan_protect_stack_decl predicate. */
1137 for (j = i; j != EOC; j = stack_vars[j].next)
1138 if (asan_protect_stack_decl (stack_vars[j].decl)
1139 && DECL_NAME (stack_vars[j].decl))
1141 repr_decl = stack_vars[j].decl;
1142 break;
1144 else if (repr_decl == NULL_TREE
1145 && DECL_P (stack_vars[j].decl)
1146 && DECL_NAME (stack_vars[j].decl))
1147 repr_decl = stack_vars[j].decl;
1148 if (repr_decl == NULL_TREE)
1149 repr_decl = stack_vars[i].decl;
1150 data->asan_decl_vec.safe_push (repr_decl);
1151 data->asan_alignb = MAX (data->asan_alignb, alignb);
1152 if (data->asan_base == NULL)
1153 data->asan_base = gen_reg_rtx (Pmode);
1154 base = data->asan_base;
1156 if (!STRICT_ALIGNMENT)
1157 base_align = crtl->max_used_stack_slot_alignment;
1158 else
1159 base_align = MAX (crtl->max_used_stack_slot_alignment,
1160 GET_MODE_ALIGNMENT (SImode)
1161 << ASAN_SHADOW_SHIFT);
1163 else
1165 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1166 base_align = crtl->max_used_stack_slot_alignment;
1169 else
1171 /* Large alignment is only processed in the last pass. */
1172 if (pred)
1173 continue;
1174 gcc_assert (large_base != NULL);
1176 large_alloc += alignb - 1;
1177 large_alloc &= -(HOST_WIDE_INT)alignb;
1178 offset = large_alloc;
1179 large_alloc += stack_vars[i].size;
1181 base = large_base;
1182 base_align = large_align;
1185 /* Create rtl for each variable based on their location within the
1186 partition. */
1187 for (j = i; j != EOC; j = stack_vars[j].next)
1189 expand_one_stack_var_at (stack_vars[j].decl,
1190 base, base_align,
1191 offset);
1195 gcc_assert (large_alloc == large_size);
1198 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1199 static HOST_WIDE_INT
1200 account_stack_vars (void)
1202 size_t si, j, i, n = stack_vars_num;
1203 HOST_WIDE_INT size = 0;
1205 for (si = 0; si < n; ++si)
1207 i = stack_vars_sorted[si];
1209 /* Skip variables that aren't partition representatives, for now. */
1210 if (stack_vars[i].representative != i)
1211 continue;
1213 size += stack_vars[i].size;
1214 for (j = i; j != EOC; j = stack_vars[j].next)
1215 set_rtl (stack_vars[j].decl, NULL);
1217 return size;
1220 /* Record the RTL assignment X for the default def of PARM. */
1222 extern void
1223 set_parm_rtl (tree parm, rtx x)
1225 gcc_assert (TREE_CODE (parm) == PARM_DECL
1226 || TREE_CODE (parm) == RESULT_DECL);
1228 if (x && !MEM_P (x))
1230 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1231 TYPE_MODE (TREE_TYPE (parm)),
1232 TYPE_ALIGN (TREE_TYPE (parm)));
1234 /* If the variable alignment is very large we'll dynamicaly
1235 allocate it, which means that in-frame portion is just a
1236 pointer. ??? We've got a pseudo for sure here, do we
1237 actually dynamically allocate its spilling area if needed?
1238 ??? Isn't it a problem when POINTER_SIZE also exceeds
1239 MAX_SUPPORTED_STACK_ALIGNMENT, as on cris and lm32? */
1240 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1241 align = POINTER_SIZE;
1243 record_alignment_for_reg_var (align);
1246 tree ssa = ssa_default_def (cfun, parm);
1247 if (!ssa)
1248 return set_rtl (parm, x);
1250 int part = var_to_partition (SA.map, ssa);
1251 gcc_assert (part != NO_PARTITION);
1253 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1254 gcc_assert (changed);
1256 set_rtl (ssa, x);
1257 gcc_assert (DECL_RTL (parm) == x);
1260 /* A subroutine of expand_one_var. Called to immediately assign rtl
1261 to a variable to be allocated in the stack frame. */
1263 static void
1264 expand_one_stack_var_1 (tree var)
1266 HOST_WIDE_INT size, offset;
1267 unsigned byte_align;
1269 if (TREE_CODE (var) == SSA_NAME)
1271 tree type = TREE_TYPE (var);
1272 size = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1273 byte_align = TYPE_ALIGN_UNIT (type);
1275 else
1277 size = tree_to_uhwi (DECL_SIZE_UNIT (var));
1278 byte_align = align_local_variable (var);
1281 /* We handle highly aligned variables in expand_stack_vars. */
1282 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1284 offset = alloc_stack_frame_space (size, byte_align);
1286 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1287 crtl->max_used_stack_slot_alignment, offset);
1290 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1291 already assigned some MEM. */
1293 static void
1294 expand_one_stack_var (tree var)
1296 if (TREE_CODE (var) == SSA_NAME)
1298 int part = var_to_partition (SA.map, var);
1299 if (part != NO_PARTITION)
1301 rtx x = SA.partition_to_pseudo[part];
1302 gcc_assert (x);
1303 gcc_assert (MEM_P (x));
1304 return;
1308 return expand_one_stack_var_1 (var);
1311 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1312 that will reside in a hard register. */
1314 static void
1315 expand_one_hard_reg_var (tree var)
1317 rest_of_decl_compilation (var, 0, 0);
1320 /* Record the alignment requirements of some variable assigned to a
1321 pseudo. */
1323 static void
1324 record_alignment_for_reg_var (unsigned int align)
1326 if (SUPPORTS_STACK_ALIGNMENT
1327 && crtl->stack_alignment_estimated < align)
1329 /* stack_alignment_estimated shouldn't change after stack
1330 realign decision made */
1331 gcc_assert (!crtl->stack_realign_processed);
1332 crtl->stack_alignment_estimated = align;
1335 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1336 So here we only make sure stack_alignment_needed >= align. */
1337 if (crtl->stack_alignment_needed < align)
1338 crtl->stack_alignment_needed = align;
1339 if (crtl->max_used_stack_slot_alignment < align)
1340 crtl->max_used_stack_slot_alignment = align;
1343 /* Create RTL for an SSA partition. */
1345 static void
1346 expand_one_ssa_partition (tree var)
1348 int part = var_to_partition (SA.map, var);
1349 gcc_assert (part != NO_PARTITION);
1351 if (SA.partition_to_pseudo[part])
1352 return;
1354 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1355 TYPE_MODE (TREE_TYPE (var)),
1356 TYPE_ALIGN (TREE_TYPE (var)));
1358 /* If the variable alignment is very large we'll dynamicaly allocate
1359 it, which means that in-frame portion is just a pointer. */
1360 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1361 align = POINTER_SIZE;
1363 record_alignment_for_reg_var (align);
1365 if (!use_register_for_decl (var))
1367 if (defer_stack_allocation (var, true))
1368 add_stack_var (var);
1369 else
1370 expand_one_stack_var_1 (var);
1371 return;
1374 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1376 rtx x = gen_reg_rtx (reg_mode);
1378 set_rtl (var, x);
1381 /* Record the association between the RTL generated for partition PART
1382 and the underlying variable of the SSA_NAME VAR. */
1384 static void
1385 adjust_one_expanded_partition_var (tree var)
1387 if (!var)
1388 return;
1390 tree decl = SSA_NAME_VAR (var);
1392 int part = var_to_partition (SA.map, var);
1393 if (part == NO_PARTITION)
1394 return;
1396 rtx x = SA.partition_to_pseudo[part];
1398 gcc_assert (x);
1400 set_rtl (var, x);
1402 if (!REG_P (x))
1403 return;
1405 /* Note if the object is a user variable. */
1406 if (decl && !DECL_ARTIFICIAL (decl))
1407 mark_user_reg (x);
1409 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1410 mark_reg_pointer (x, get_pointer_alignment (var));
1413 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1414 that will reside in a pseudo register. */
1416 static void
1417 expand_one_register_var (tree var)
1419 if (TREE_CODE (var) == SSA_NAME)
1421 int part = var_to_partition (SA.map, var);
1422 if (part != NO_PARTITION)
1424 rtx x = SA.partition_to_pseudo[part];
1425 gcc_assert (x);
1426 gcc_assert (REG_P (x));
1427 return;
1429 gcc_unreachable ();
1432 tree decl = var;
1433 tree type = TREE_TYPE (decl);
1434 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1435 rtx x = gen_reg_rtx (reg_mode);
1437 set_rtl (var, x);
1439 /* Note if the object is a user variable. */
1440 if (!DECL_ARTIFICIAL (decl))
1441 mark_user_reg (x);
1443 if (POINTER_TYPE_P (type))
1444 mark_reg_pointer (x, get_pointer_alignment (var));
1447 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1448 has some associated error, e.g. its type is error-mark. We just need
1449 to pick something that won't crash the rest of the compiler. */
1451 static void
1452 expand_one_error_var (tree var)
1454 machine_mode mode = DECL_MODE (var);
1455 rtx x;
1457 if (mode == BLKmode)
1458 x = gen_rtx_MEM (BLKmode, const0_rtx);
1459 else if (mode == VOIDmode)
1460 x = const0_rtx;
1461 else
1462 x = gen_reg_rtx (mode);
1464 SET_DECL_RTL (var, x);
1467 /* A subroutine of expand_one_var. VAR is a variable that will be
1468 allocated to the local stack frame. Return true if we wish to
1469 add VAR to STACK_VARS so that it will be coalesced with other
1470 variables. Return false to allocate VAR immediately.
1472 This function is used to reduce the number of variables considered
1473 for coalescing, which reduces the size of the quadratic problem. */
1475 static bool
1476 defer_stack_allocation (tree var, bool toplevel)
1478 tree size_unit = TREE_CODE (var) == SSA_NAME
1479 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1480 : DECL_SIZE_UNIT (var);
1482 /* Whether the variable is small enough for immediate allocation not to be
1483 a problem with regard to the frame size. */
1484 bool smallish
1485 = ((HOST_WIDE_INT) tree_to_uhwi (size_unit)
1486 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING));
1488 /* If stack protection is enabled, *all* stack variables must be deferred,
1489 so that we can re-order the strings to the top of the frame.
1490 Similarly for Address Sanitizer. */
1491 if (flag_stack_protect || ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK))
1492 return true;
1494 unsigned int align = TREE_CODE (var) == SSA_NAME
1495 ? TYPE_ALIGN (TREE_TYPE (var))
1496 : DECL_ALIGN (var);
1498 /* We handle "large" alignment via dynamic allocation. We want to handle
1499 this extra complication in only one place, so defer them. */
1500 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1501 return true;
1503 bool ignored = TREE_CODE (var) == SSA_NAME
1504 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1505 : DECL_IGNORED_P (var);
1507 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1508 might be detached from their block and appear at toplevel when we reach
1509 here. We want to coalesce them with variables from other blocks when
1510 the immediate contribution to the frame size would be noticeable. */
1511 if (toplevel && optimize > 0 && ignored && !smallish)
1512 return true;
1514 /* Variables declared in the outermost scope automatically conflict
1515 with every other variable. The only reason to want to defer them
1516 at all is that, after sorting, we can more efficiently pack
1517 small variables in the stack frame. Continue to defer at -O2. */
1518 if (toplevel && optimize < 2)
1519 return false;
1521 /* Without optimization, *most* variables are allocated from the
1522 stack, which makes the quadratic problem large exactly when we
1523 want compilation to proceed as quickly as possible. On the
1524 other hand, we don't want the function's stack frame size to
1525 get completely out of hand. So we avoid adding scalars and
1526 "small" aggregates to the list at all. */
1527 if (optimize == 0 && smallish)
1528 return false;
1530 return true;
1533 /* A subroutine of expand_used_vars. Expand one variable according to
1534 its flavor. Variables to be placed on the stack are not actually
1535 expanded yet, merely recorded.
1536 When REALLY_EXPAND is false, only add stack values to be allocated.
1537 Return stack usage this variable is supposed to take.
1540 static HOST_WIDE_INT
1541 expand_one_var (tree var, bool toplevel, bool really_expand)
1543 unsigned int align = BITS_PER_UNIT;
1544 tree origvar = var;
1546 var = SSAVAR (var);
1548 if (TREE_TYPE (var) != error_mark_node && TREE_CODE (var) == VAR_DECL)
1550 /* Because we don't know if VAR will be in register or on stack,
1551 we conservatively assume it will be on stack even if VAR is
1552 eventually put into register after RA pass. For non-automatic
1553 variables, which won't be on stack, we collect alignment of
1554 type and ignore user specified alignment. Similarly for
1555 SSA_NAMEs for which use_register_for_decl returns true. */
1556 if (TREE_STATIC (var)
1557 || DECL_EXTERNAL (var)
1558 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1559 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1560 TYPE_MODE (TREE_TYPE (var)),
1561 TYPE_ALIGN (TREE_TYPE (var)));
1562 else if (DECL_HAS_VALUE_EXPR_P (var)
1563 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1564 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1565 or variables which were assigned a stack slot already by
1566 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1567 changed from the offset chosen to it. */
1568 align = crtl->stack_alignment_estimated;
1569 else
1570 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1572 /* If the variable alignment is very large we'll dynamicaly allocate
1573 it, which means that in-frame portion is just a pointer. */
1574 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1575 align = POINTER_SIZE;
1578 record_alignment_for_reg_var (align);
1580 if (TREE_CODE (origvar) == SSA_NAME)
1582 gcc_assert (TREE_CODE (var) != VAR_DECL
1583 || (!DECL_EXTERNAL (var)
1584 && !DECL_HAS_VALUE_EXPR_P (var)
1585 && !TREE_STATIC (var)
1586 && TREE_TYPE (var) != error_mark_node
1587 && !DECL_HARD_REGISTER (var)
1588 && really_expand));
1590 if (TREE_CODE (var) != VAR_DECL && TREE_CODE (origvar) != SSA_NAME)
1592 else if (DECL_EXTERNAL (var))
1594 else if (DECL_HAS_VALUE_EXPR_P (var))
1596 else if (TREE_STATIC (var))
1598 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1600 else if (TREE_TYPE (var) == error_mark_node)
1602 if (really_expand)
1603 expand_one_error_var (var);
1605 else if (TREE_CODE (var) == VAR_DECL && DECL_HARD_REGISTER (var))
1607 if (really_expand)
1609 expand_one_hard_reg_var (var);
1610 if (!DECL_HARD_REGISTER (var))
1611 /* Invalid register specification. */
1612 expand_one_error_var (var);
1615 else if (use_register_for_decl (var))
1617 if (really_expand)
1618 expand_one_register_var (origvar);
1620 else if (! valid_constant_size_p (DECL_SIZE_UNIT (var)))
1622 /* Reject variables which cover more than half of the address-space. */
1623 if (really_expand)
1625 error ("size of variable %q+D is too large", var);
1626 expand_one_error_var (var);
1629 else if (defer_stack_allocation (var, toplevel))
1630 add_stack_var (origvar);
1631 else
1633 if (really_expand)
1635 if (lookup_attribute ("naked",
1636 DECL_ATTRIBUTES (current_function_decl)))
1637 error ("cannot allocate stack for variable %q+D, naked function.",
1638 var);
1640 expand_one_stack_var (origvar);
1644 return tree_to_uhwi (DECL_SIZE_UNIT (var));
1646 return 0;
1649 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1650 expanding variables. Those variables that can be put into registers
1651 are allocated pseudos; those that can't are put on the stack.
1653 TOPLEVEL is true if this is the outermost BLOCK. */
1655 static void
1656 expand_used_vars_for_block (tree block, bool toplevel)
1658 tree t;
1660 /* Expand all variables at this level. */
1661 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1662 if (TREE_USED (t)
1663 && ((TREE_CODE (t) != VAR_DECL && TREE_CODE (t) != RESULT_DECL)
1664 || !DECL_NONSHAREABLE (t)))
1665 expand_one_var (t, toplevel, true);
1667 /* Expand all variables at containing levels. */
1668 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1669 expand_used_vars_for_block (t, false);
1672 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1673 and clear TREE_USED on all local variables. */
1675 static void
1676 clear_tree_used (tree block)
1678 tree t;
1680 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1681 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1682 if ((TREE_CODE (t) != VAR_DECL && TREE_CODE (t) != RESULT_DECL)
1683 || !DECL_NONSHAREABLE (t))
1684 TREE_USED (t) = 0;
1686 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1687 clear_tree_used (t);
/* Values of flag_stack_protect tested in this file.  */
enum {
  /* A guard is created when the function calls alloca, has protected
     decls, or carries the "stack_protect" attribute.  */
  SPCT_FLAG_DEFAULT = 1,

  /* A guard is created unconditionally.  */
  SPCT_FLAG_ALL = 2,

  /* As SPCT_FLAG_DEFAULT, and additionally when the function has local
     arrays or addressable locals, or calls that use a return slot.  */
  SPCT_FLAG_STRONG = 3,

  /* A guard is created only for functions carrying the "stack_protect"
     attribute.  */
  SPCT_FLAG_EXPLICIT = 4
};
1697 /* Examine TYPE and determine a bit mask of the following features. */
1699 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1700 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1701 #define SPCT_HAS_ARRAY 4
1702 #define SPCT_HAS_AGGREGATE 8
1704 static unsigned int
1705 stack_protect_classify_type (tree type)
1707 unsigned int ret = 0;
1708 tree t;
1710 switch (TREE_CODE (type))
1712 case ARRAY_TYPE:
1713 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1714 if (t == char_type_node
1715 || t == signed_char_type_node
1716 || t == unsigned_char_type_node)
1718 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1719 unsigned HOST_WIDE_INT len;
1721 if (!TYPE_SIZE_UNIT (type)
1722 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1723 len = max;
1724 else
1725 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1727 if (len < max)
1728 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1729 else
1730 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1732 else
1733 ret = SPCT_HAS_ARRAY;
1734 break;
1736 case UNION_TYPE:
1737 case QUAL_UNION_TYPE:
1738 case RECORD_TYPE:
1739 ret = SPCT_HAS_AGGREGATE;
1740 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1741 if (TREE_CODE (t) == FIELD_DECL)
1742 ret |= stack_protect_classify_type (TREE_TYPE (t));
1743 break;
1745 default:
1746 break;
1749 return ret;
1752 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1753 part of the local stack frame. Remember if we ever return nonzero for
1754 any variable in this function. The return value is the phase number in
1755 which the variable should be allocated. */
1757 static int
1758 stack_protect_decl_phase (tree decl)
1760 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1761 int ret = 0;
1763 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1764 has_short_buffer = true;
1766 if (flag_stack_protect == SPCT_FLAG_ALL
1767 || flag_stack_protect == SPCT_FLAG_STRONG
1768 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1769 && lookup_attribute ("stack_protect",
1770 DECL_ATTRIBUTES (current_function_decl))))
1772 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1773 && !(bits & SPCT_HAS_AGGREGATE))
1774 ret = 1;
1775 else if (bits & SPCT_HAS_ARRAY)
1776 ret = 2;
1778 else
1779 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1781 if (ret)
1782 has_protected_decls = true;
1784 return ret;
1787 /* Two helper routines that check for phase 1 and phase 2. These are used
1788 as callbacks for expand_stack_vars. */
1790 static bool
1791 stack_protect_decl_phase_1 (size_t i)
1793 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1796 static bool
1797 stack_protect_decl_phase_2 (size_t i)
1799 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1802 /* And helper function that checks for asan phase (with stack protector
1803 it is phase 3). This is used as callback for expand_stack_vars.
1804 Returns true if any of the vars in the partition need to be protected. */
1806 static bool
1807 asan_decl_phase_3 (size_t i)
1809 while (i != EOC)
1811 if (asan_protect_stack_decl (stack_vars[i].decl))
1812 return true;
1813 i = stack_vars[i].next;
1815 return false;
1818 /* Ensure that variables in different stack protection phases conflict
1819 so that they are not merged and share the same stack slot. */
1821 static void
1822 add_stack_protection_conflicts (void)
1824 size_t i, j, n = stack_vars_num;
1825 unsigned char *phase;
1827 phase = XNEWVEC (unsigned char, n);
1828 for (i = 0; i < n; ++i)
1829 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1831 for (i = 0; i < n; ++i)
1833 unsigned char ph_i = phase[i];
1834 for (j = i + 1; j < n; ++j)
1835 if (ph_i != phase[j])
1836 add_stack_var_conflict (i, j);
1839 XDELETEVEC (phase);
1842 /* Create a decl for the guard at the top of the stack frame. */
1844 static void
1845 create_stack_guard (void)
1847 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1848 VAR_DECL, NULL, ptr_type_node);
1849 TREE_THIS_VOLATILE (guard) = 1;
1850 TREE_USED (guard) = 1;
1851 expand_one_stack_var (guard);
1852 crtl->stack_protect_guard = guard;
1855 /* Prepare for expanding variables. */
1856 static void
1857 init_vars_expansion (void)
1859 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1860 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1862 /* A map from decl to stack partition. */
1863 decl_to_stack_part = new hash_map<tree, size_t>;
1865 /* Initialize local stack smashing state. */
1866 has_protected_decls = false;
1867 has_short_buffer = false;
1870 /* Free up stack variable graph data. */
1871 static void
1872 fini_vars_expansion (void)
1874 bitmap_obstack_release (&stack_var_bitmap_obstack);
1875 if (stack_vars)
1876 XDELETEVEC (stack_vars);
1877 if (stack_vars_sorted)
1878 XDELETEVEC (stack_vars_sorted);
1879 stack_vars = NULL;
1880 stack_vars_sorted = NULL;
1881 stack_vars_alloc = stack_vars_num = 0;
1882 delete decl_to_stack_part;
1883 decl_to_stack_part = NULL;
1886 /* Make a fair guess for the size of the stack frame of the function
1887 in NODE. This doesn't have to be exact, the result is only used in
1888 the inline heuristics. So we don't want to run the full stack var
1889 packing algorithm (which is quadratic in the number of stack vars).
1890 Instead, we calculate the total size of all stack vars. This turns
1891 out to be a pretty fair estimate -- packing of stack vars doesn't
1892 happen very often. */
1894 HOST_WIDE_INT
1895 estimated_stack_frame_size (struct cgraph_node *node)
1897 HOST_WIDE_INT size = 0;
1898 size_t i;
1899 tree var;
1900 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1902 push_cfun (fn);
1904 init_vars_expansion ();
1906 FOR_EACH_LOCAL_DECL (fn, i, var)
1907 if (auto_var_in_fn_p (var, fn->decl))
1908 size += expand_one_var (var, true, false);
1910 if (stack_vars_num > 0)
1912 /* Fake sorting the stack vars for account_stack_vars (). */
1913 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1914 for (i = 0; i < stack_vars_num; ++i)
1915 stack_vars_sorted[i] = i;
1916 size += account_stack_vars ();
1919 fini_vars_expansion ();
1920 pop_cfun ();
1921 return size;
1924 /* Helper routine to check if a record or union contains an array field. */
1926 static int
1927 record_or_union_type_has_array_p (const_tree tree_type)
1929 tree fields = TYPE_FIELDS (tree_type);
1930 tree f;
1932 for (f = fields; f; f = DECL_CHAIN (f))
1933 if (TREE_CODE (f) == FIELD_DECL)
1935 tree field_type = TREE_TYPE (f);
1936 if (RECORD_OR_UNION_TYPE_P (field_type)
1937 && record_or_union_type_has_array_p (field_type))
1938 return 1;
1939 if (TREE_CODE (field_type) == ARRAY_TYPE)
1940 return 1;
1942 return 0;
1945 /* Check if the current function has local referenced variables that
1946 have their addresses taken, contain an array, or are arrays. */
1948 static bool
1949 stack_protect_decl_p ()
1951 unsigned i;
1952 tree var;
1954 FOR_EACH_LOCAL_DECL (cfun, i, var)
1955 if (!is_global_var (var))
1957 tree var_type = TREE_TYPE (var);
1958 if (TREE_CODE (var) == VAR_DECL
1959 && (TREE_CODE (var_type) == ARRAY_TYPE
1960 || TREE_ADDRESSABLE (var)
1961 || (RECORD_OR_UNION_TYPE_P (var_type)
1962 && record_or_union_type_has_array_p (var_type))))
1963 return true;
1965 return false;
1968 /* Check if the current function has calls that use a return slot. */
1970 static bool
1971 stack_protect_return_slot_p ()
1973 basic_block bb;
1975 FOR_ALL_BB_FN (bb, cfun)
1976 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1977 !gsi_end_p (gsi); gsi_next (&gsi))
1979 gimple *stmt = gsi_stmt (gsi);
1980 /* This assumes that calls to internal-only functions never
1981 use a return slot. */
1982 if (is_gimple_call (stmt)
1983 && !gimple_call_internal_p (stmt)
1984 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
1985 gimple_call_fndecl (stmt)))
1986 return true;
1988 return false;
1991 /* Expand all variables used in the function. */
1993 static rtx_insn *
1994 expand_used_vars (void)
1996 tree var, outer_block = DECL_INITIAL (current_function_decl);
1997 vec<tree> maybe_local_decls = vNULL;
1998 rtx_insn *var_end_seq = NULL;
1999 unsigned i;
2000 unsigned len;
2001 bool gen_stack_protect_signal = false;
2003 /* Compute the phase of the stack frame for this function. */
2005 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2006 int off = STARTING_FRAME_OFFSET % align;
2007 frame_phase = off ? align - off : 0;
2010 /* Set TREE_USED on all variables in the local_decls. */
2011 FOR_EACH_LOCAL_DECL (cfun, i, var)
2012 TREE_USED (var) = 1;
2013 /* Clear TREE_USED on all variables associated with a block scope. */
2014 clear_tree_used (DECL_INITIAL (current_function_decl));
2016 init_vars_expansion ();
2018 if (targetm.use_pseudo_pic_reg ())
2019 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2021 for (i = 0; i < SA.map->num_partitions; i++)
2023 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2024 continue;
2026 tree var = partition_to_var (SA.map, i);
2028 gcc_assert (!virtual_operand_p (var));
2030 expand_one_ssa_partition (var);
2033 if (flag_stack_protect == SPCT_FLAG_STRONG)
2034 gen_stack_protect_signal
2035 = stack_protect_decl_p () || stack_protect_return_slot_p ();
2037 /* At this point all variables on the local_decls with TREE_USED
2038 set are not associated with any block scope. Lay them out. */
2040 len = vec_safe_length (cfun->local_decls);
2041 FOR_EACH_LOCAL_DECL (cfun, i, var)
2043 bool expand_now = false;
2045 /* Expanded above already. */
2046 if (is_gimple_reg (var))
2048 TREE_USED (var) = 0;
2049 goto next;
2051 /* We didn't set a block for static or extern because it's hard
2052 to tell the difference between a global variable (re)declared
2053 in a local scope, and one that's really declared there to
2054 begin with. And it doesn't really matter much, since we're
2055 not giving them stack space. Expand them now. */
2056 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2057 expand_now = true;
2059 /* Expand variables not associated with any block now. Those created by
2060 the optimizers could be live anywhere in the function. Those that
2061 could possibly have been scoped originally and detached from their
2062 block will have their allocation deferred so we coalesce them with
2063 others when optimization is enabled. */
2064 else if (TREE_USED (var))
2065 expand_now = true;
2067 /* Finally, mark all variables on the list as used. We'll use
2068 this in a moment when we expand those associated with scopes. */
2069 TREE_USED (var) = 1;
2071 if (expand_now)
2072 expand_one_var (var, true, true);
2074 next:
2075 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2077 rtx rtl = DECL_RTL_IF_SET (var);
2079 /* Keep artificial non-ignored vars in cfun->local_decls
2080 chain until instantiate_decls. */
2081 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2082 add_local_decl (cfun, var);
2083 else if (rtl == NULL_RTX)
2084 /* If rtl isn't set yet, which can happen e.g. with
2085 -fstack-protector, retry before returning from this
2086 function. */
2087 maybe_local_decls.safe_push (var);
2091 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2093 +-----------------+-----------------+
2094 | ...processed... | ...duplicates...|
2095 +-----------------+-----------------+
2097 +-- LEN points here.
2099 We just want the duplicates, as those are the artificial
2100 non-ignored vars that we want to keep until instantiate_decls.
2101 Move them down and truncate the array. */
2102 if (!vec_safe_is_empty (cfun->local_decls))
2103 cfun->local_decls->block_remove (0, len);
2105 /* At this point, all variables within the block tree with TREE_USED
2106 set are actually used by the optimized function. Lay them out. */
2107 expand_used_vars_for_block (outer_block, true);
2109 if (stack_vars_num > 0)
2111 add_scope_conflicts ();
2113 /* If stack protection is enabled, we don't share space between
2114 vulnerable data and non-vulnerable data. */
2115 if (flag_stack_protect != 0
2116 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2117 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2118 && lookup_attribute ("stack_protect",
2119 DECL_ATTRIBUTES (current_function_decl)))))
2120 add_stack_protection_conflicts ();
2122 /* Now that we have collected all stack variables, and have computed a
2123 minimal interference graph, attempt to save some stack space. */
2124 partition_stack_vars ();
2125 if (dump_file)
2126 dump_stack_var_partition ();
2129 switch (flag_stack_protect)
2131 case SPCT_FLAG_ALL:
2132 create_stack_guard ();
2133 break;
2135 case SPCT_FLAG_STRONG:
2136 if (gen_stack_protect_signal
2137 || cfun->calls_alloca || has_protected_decls
2138 || lookup_attribute ("stack_protect",
2139 DECL_ATTRIBUTES (current_function_decl)))
2140 create_stack_guard ();
2141 break;
2143 case SPCT_FLAG_DEFAULT:
2144 if (cfun->calls_alloca || has_protected_decls
2145 || lookup_attribute ("stack_protect",
2146 DECL_ATTRIBUTES (current_function_decl)))
2147 create_stack_guard ();
2148 break;
2150 case SPCT_FLAG_EXPLICIT:
2151 if (lookup_attribute ("stack_protect",
2152 DECL_ATTRIBUTES (current_function_decl)))
2153 create_stack_guard ();
2154 break;
2155 default:
2159 /* Assign rtl to each variable based on these partitions. */
2160 if (stack_vars_num > 0)
2162 struct stack_vars_data data;
2164 data.asan_vec = vNULL;
2165 data.asan_decl_vec = vNULL;
2166 data.asan_base = NULL_RTX;
2167 data.asan_alignb = 0;
2169 /* Reorder decls to be protected by iterating over the variables
2170 array multiple times, and allocating out of each phase in turn. */
2171 /* ??? We could probably integrate this into the qsort we did
2172 earlier, such that we naturally see these variables first,
2173 and thus naturally allocate things in the right order. */
2174 if (has_protected_decls)
2176 /* Phase 1 contains only character arrays. */
2177 expand_stack_vars (stack_protect_decl_phase_1, &data);
2179 /* Phase 2 contains other kinds of arrays. */
2180 if (flag_stack_protect == SPCT_FLAG_ALL
2181 || flag_stack_protect == SPCT_FLAG_STRONG
2182 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2183 && lookup_attribute ("stack_protect",
2184 DECL_ATTRIBUTES (current_function_decl))))
2185 expand_stack_vars (stack_protect_decl_phase_2, &data);
2188 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK)
2189 /* Phase 3, any partitions that need asan protection
2190 in addition to phase 1 and 2. */
2191 expand_stack_vars (asan_decl_phase_3, &data);
2193 if (!data.asan_vec.is_empty ())
2195 HOST_WIDE_INT prev_offset = frame_offset;
2196 HOST_WIDE_INT offset, sz, redzonesz;
2197 redzonesz = ASAN_RED_ZONE_SIZE;
2198 sz = data.asan_vec[0] - prev_offset;
2199 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2200 && data.asan_alignb <= 4096
2201 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2202 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2203 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
2204 offset
2205 = alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE);
2206 data.asan_vec.safe_push (prev_offset);
2207 data.asan_vec.safe_push (offset);
2208 /* Leave space for alignment if STRICT_ALIGNMENT. */
2209 if (STRICT_ALIGNMENT)
2210 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2211 << ASAN_SHADOW_SHIFT)
2212 / BITS_PER_UNIT, 1);
2214 var_end_seq
2215 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2216 data.asan_base,
2217 data.asan_alignb,
2218 data.asan_vec.address (),
2219 data.asan_decl_vec.address (),
2220 data.asan_vec.length ());
2223 expand_stack_vars (NULL, &data);
2225 data.asan_vec.release ();
2226 data.asan_decl_vec.release ();
2229 fini_vars_expansion ();
2231 /* If there were any artificial non-ignored vars without rtl
2232 found earlier, see if deferred stack allocation hasn't assigned
2233 rtl to them. */
2234 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2236 rtx rtl = DECL_RTL_IF_SET (var);
2238 /* Keep artificial non-ignored vars in cfun->local_decls
2239 chain until instantiate_decls. */
2240 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2241 add_local_decl (cfun, var);
2243 maybe_local_decls.release ();
2245 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2246 if (STACK_ALIGNMENT_NEEDED)
2248 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2249 if (!FRAME_GROWS_DOWNWARD)
2250 frame_offset += align - 1;
2251 frame_offset &= -align;
2254 return var_end_seq;
2258 /* If we need to produce a detailed dump, print the tree representation
2259 for STMT to the dump file. SINCE is the last RTX after which the RTL
2260 generated for STMT should have been appended. */
2262 static void
2263 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2265 if (dump_file && (dump_flags & TDF_DETAILS))
2267 fprintf (dump_file, "\n;; ");
2268 print_gimple_stmt (dump_file, stmt, 0,
2269 TDF_SLIM | (dump_flags & TDF_LINENO));
2270 fprintf (dump_file, "\n");
2272 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2276 /* Maps the blocks that do not contain tree labels to rtx labels.
   label_rtx_for_bb consults this map and adds an entry for a block
   the first time it has to generate a fresh label for it. */
2278 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2280 /* Returns the label_rtx expression for a label starting basic block BB. */
2282 static rtx_code_label *
2283 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2285 gimple_stmt_iterator gsi;
2286 tree lab;
2288 if (bb->flags & BB_RTL)
2289 return block_label (bb);
2291 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2292 if (elt)
2293 return *elt;
2295 /* Find the tree label if it is present. */
2297 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2299 glabel *lab_stmt;
2301 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2302 if (!lab_stmt)
2303 break;
2305 lab = gimple_label_label (lab_stmt);
2306 if (DECL_NONLOCAL (lab))
2307 break;
2309 return jump_target_rtx (lab);
2312 rtx_code_label *l = gen_label_rtx ();
2313 lab_rtx_for_bb->put (bb, l);
2314 return l;
2318 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2319 of a basic block where we just expanded the conditional at the end,
2320 possibly clean up the CFG and instruction sequence. LAST is the
2321 last instruction before the just emitted jump sequence.
   Nothing is done unless the last emitted insn is a barrier; in that
   case E is removed and every jump between LAST and the final
   unconditional jump is deleted. */
2323 static void
2324 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2326 /* Special case: when jumpif decides that the condition is
2327 trivial it emits an unconditional jump (and the necessary
2328 barrier). But we still have two edges, the fallthru one is
2329 wrong. purge_dead_edges would clean this up later. Unfortunately
2330 we have to insert insns (and split edges) before
2331 find_many_sub_basic_blocks and hence before purge_dead_edges.
2332 But splitting edges might create new blocks which depend on the
2333 fact that if there are two edges there's no barrier. So the
2334 barrier would get lost and verify_flow_info would ICE. Instead
2335 of auditing all edge splitters to care for the barrier (which
2336 normally isn't there in a cleaned CFG), fix it here. */
2337 if (BARRIER_P (get_last_insn ()))
2339 rtx_insn *insn;
2340 remove_edge (e);
2341 /* Now, we have a single successor block, if we have insns to
2342 insert on the remaining edge we potentially will insert
2343 it at the end of this block (if the dest block isn't feasible)
2344 in order to avoid splitting the edge. This insertion will take
2345 place in front of the last jump. But we might have emitted
2346 multiple jumps (conditional and one unconditional) to the
2347 same destination. Inserting in front of the last one then
2348 is a problem. See PR 40021. We fix this by deleting all
2349 jumps except the last unconditional one. */
/* INSN is the insn just before the trailing barrier. */
2350 insn = PREV_INSN (get_last_insn ());
2351 /* Make sure we have an unconditional jump. Otherwise we're
2352 confused. */
2353 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
/* Walk backwards towards LAST. INSN is stepped back first, so the
   insn being examined (and possibly deleted) is NEXT_INSN (insn);
   an unconditional jump has its following barrier deleted as well. */
2354 for (insn = PREV_INSN (insn); insn != last;)
2356 insn = PREV_INSN (insn);
2357 if (JUMP_P (NEXT_INSN (insn)))
2359 if (!any_condjump_p (NEXT_INSN (insn)))
2361 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2362 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2364 delete_insn (NEXT_INSN (insn));
2370 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2371 Returns a new basic block if we've terminated the current basic
2372 block and created a new one, and NULL otherwise.
   BB is the block that ends in STMT. NULL is returned when one of the
   two successors is BB->next_bb, so that a single conditional jump with
   a fallthru edge suffices. */
2374 static basic_block
2375 expand_gimple_cond (basic_block bb, gcond *stmt)
2377 basic_block new_bb, dest;
2378 edge new_edge;
2379 edge true_edge;
2380 edge false_edge;
2381 rtx_insn *last2, *last;
2382 enum tree_code code;
2383 tree op0, op1;
2385 code = gimple_cond_code (stmt);
2386 op0 = gimple_cond_lhs (stmt);
2387 op1 = gimple_cond_rhs (stmt);
2388 /* We're sometimes presented with such code:
2389 D.123_1 = x < y;
2390 if (D.123_1 != 0)
2392 This would expand to two comparisons which then later might
2393 be cleaned up by combine. But some pattern matchers like if-conversion
2394 work better when there's only one compare, so make up for this
2395 here as special exception if TER would have made the same change. */
2396 if (SA.values
2397 && TREE_CODE (op0) == SSA_NAME
2398 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2399 && TREE_CODE (op1) == INTEGER_CST
2400 && ((gimple_cond_code (stmt) == NE_EXPR
2401 && integer_zerop (op1))
2402 || (gimple_cond_code (stmt) == EQ_EXPR
2403 && integer_onep (op1)))
2404 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2406 gimple *second = SSA_NAME_DEF_STMT (op0);
2407 if (gimple_code (second) == GIMPLE_ASSIGN)
2409 enum tree_code code2 = gimple_assign_rhs_code (second);
/* The defining statement is itself a comparison: branch on it
   directly instead of on the boolean it produced. */
2410 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2412 code = code2;
2413 op0 = gimple_assign_rhs1 (second);
2414 op1 = gimple_assign_rhs2 (second);
2416 /* If jumps are cheap and the target does not support conditional
2417 compare, turn some more codes into jumpy sequences. */
2418 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2419 && targetm.gen_ccmp_first == NULL)
2421 if ((code2 == BIT_AND_EXPR
2422 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2423 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2424 || code2 == TRUTH_AND_EXPR)
2426 code = TRUTH_ANDIF_EXPR;
2427 op0 = gimple_assign_rhs1 (second);
2428 op1 = gimple_assign_rhs2 (second);
2430 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2432 code = TRUTH_ORIF_EXPR;
2433 op0 = gimple_assign_rhs1 (second);
2434 op1 = gimple_assign_rhs2 (second);
/* LAST2 keeps the insn preceding everything emitted for STMT; it is
   used for the dump in the two-jump case below, where LAST is
   reassigned. */
2440 last2 = last = get_last_insn ();
2442 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2443 set_curr_insn_location (gimple_location (stmt));
2445 /* These flags have no purpose in RTL land. */
2446 true_edge->flags &= ~EDGE_TRUE_VALUE;
2447 false_edge->flags &= ~EDGE_FALSE_VALUE;
2449 /* We can either have a pure conditional jump with one fallthru edge or
2450 two-way jump that needs to be decomposed into two basic blocks. */
/* False destination is the next block: jump when the condition holds
   and fall through otherwise. */
2451 if (false_edge->dest == bb->next_bb)
2453 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2454 true_edge->probability);
2455 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2456 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2457 set_curr_insn_location (true_edge->goto_locus);
2458 false_edge->flags |= EDGE_FALLTHRU;
2459 maybe_cleanup_end_of_block (false_edge, last);
2460 return NULL;
/* True destination is the next block: jump when the condition fails
   and fall through otherwise. */
2462 if (true_edge->dest == bb->next_bb)
2464 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2465 false_edge->probability);
2466 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2467 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2468 set_curr_insn_location (false_edge->goto_locus);
2469 true_edge->flags |= EDGE_FALLTHRU;
2470 maybe_cleanup_end_of_block (true_edge, last);
2471 return NULL;
/* Neither destination is the next block: emit a conditional jump to
   the true destination followed by an unconditional jump to the false
   one. The unconditional jump is placed in a new basic block. */
2474 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2475 true_edge->probability);
2476 last = get_last_insn ();
2477 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2478 set_curr_insn_location (false_edge->goto_locus);
2479 emit_jump (label_rtx_for_bb (false_edge->dest));
/* BB ends with what jumpif_1 emitted, not counting a trailing barrier. */
2481 BB_END (bb) = last;
2482 if (BARRIER_P (BB_END (bb)))
2483 BB_END (bb) = PREV_INSN (BB_END (bb));
2484 update_bb_for_insn (bb);
/* The new block holds the insns emitted after LAST. The false edge is
   redirected to it as a fallthru, and a new edge carries on from it to
   the original false destination. */
2486 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2487 dest = false_edge->dest;
2488 redirect_edge_succ (false_edge, new_bb);
2489 false_edge->flags |= EDGE_FALLTHRU;
2490 new_bb->count = false_edge->count;
2491 new_bb->frequency = EDGE_FREQUENCY (false_edge);
2492 add_bb_to_loop (new_bb, bb->loop_father);
2493 new_edge = make_edge (new_bb, dest, 0);
2494 new_edge->probability = REG_BR_PROB_BASE;
2495 new_edge->count = new_bb->count;
2496 if (BARRIER_P (BB_END (new_bb)))
2497 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2498 update_bb_for_insn (new_bb);
2500 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2502 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2504 set_curr_insn_location (true_edge->goto_locus);
2505 true_edge->goto_locus = curr_insn_location ();
2508 return new_bb;
2511 /* Mark all calls that can have a transaction restart. */
2513 static void
2514 mark_transaction_restart_calls (gimple *stmt)
2516 struct tm_restart_node dummy;
2517 tm_restart_node **slot;
2519 if (!cfun->gimple_df->tm_restart)
2520 return;
2522 dummy.stmt = stmt;
2523 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2524 if (slot)
2526 struct tm_restart_node *n = *slot;
2527 tree list = n->label_or_list;
2528 rtx_insn *insn;
2530 for (insn = next_real_insn (get_last_insn ());
2531 !CALL_P (insn);
2532 insn = next_real_insn (insn))
2533 continue;
2535 if (TREE_CODE (list) == LABEL_DECL)
2536 add_reg_note (insn, REG_TM, label_rtx (list));
2537 else
2538 for (; list ; list = TREE_CHAIN (list))
2539 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2543 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2544 statement STMT. */
2546 static void
2547 expand_call_stmt (gcall *stmt)
2549 tree exp, decl, lhs;
2550 bool builtin_p;
2551 size_t i;
2553 if (gimple_call_internal_p (stmt))
2555 expand_internal_call (stmt);
2556 return;
2559 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2561 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2562 decl = gimple_call_fndecl (stmt);
2563 builtin_p = decl && DECL_BUILT_IN (decl);
2565 /* If this is not a builtin function, the function type through which the
2566 call is made may be different from the type of the function. */
2567 if (!builtin_p)
2568 CALL_EXPR_FN (exp)
2569 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2570 CALL_EXPR_FN (exp));
2572 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2573 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2575 for (i = 0; i < gimple_call_num_args (stmt); i++)
2577 tree arg = gimple_call_arg (stmt, i);
2578 gimple *def;
2579 /* TER addresses into arguments of builtin functions so we have a
2580 chance to infer more correct alignment information. See PR39954. */
2581 if (builtin_p
2582 && TREE_CODE (arg) == SSA_NAME
2583 && (def = get_gimple_for_ssa_name (arg))
2584 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2585 arg = gimple_assign_rhs1 (def);
2586 CALL_EXPR_ARG (exp, i) = arg;
2589 if (gimple_has_side_effects (stmt))
2590 TREE_SIDE_EFFECTS (exp) = 1;
2592 if (gimple_call_nothrow_p (stmt))
2593 TREE_NOTHROW (exp) = 1;
2595 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2596 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2597 if (decl
2598 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
2599 && (DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA
2600 || DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA_WITH_ALIGN))
2601 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2602 else
2603 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2604 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2605 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2606 CALL_WITH_BOUNDS_P (exp) = gimple_call_with_bounds_p (stmt);
2608 /* Ensure RTL is created for debug args. */
2609 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2611 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2612 unsigned int ix;
2613 tree dtemp;
2615 if (debug_args)
2616 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2618 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2619 expand_debug_expr (dtemp);
2623 lhs = gimple_call_lhs (stmt);
2624 if (lhs)
2625 expand_assignment (lhs, exp, false);
2626 else
2627 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2629 mark_transaction_restart_calls (stmt);
2633 /* Generate RTL for an asm statement (explicit assembler code).
2634 STRING is a STRING_CST node containing the assembler code text,
2635 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2636 insn is volatile; don't optimize it. */
2638 static void
2639 expand_asm_loc (tree string, int vol, location_t locus)
2641 rtx body;
2643 if (TREE_CODE (string) == ADDR_EXPR)
2644 string = TREE_OPERAND (string, 0);
2646 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2647 ggc_strdup (TREE_STRING_POINTER (string)),
2648 locus);
2650 MEM_VOLATILE_P (body) = vol;
2652 emit_insn (body);
/* Return the number of times character C occurs in the NUL-terminated
   string S.  The terminating NUL itself is never counted, so the
   result is 0 for an empty string.  */
static int
n_occurrences (int c, const char *s)
{
  int n = 0;
  while (*s)
    n += (*s++ == c);
  return n;
}
2665 /* A subroutine of expand_asm_operands. Check that all operands have
2666 the same number of alternatives. Return true if so. */
2668 static bool
2669 check_operand_nalternatives (const vec<const char *> &constraints)
2671 unsigned len = constraints.length();
2672 if (len > 0)
2674 int nalternatives = n_occurrences (',', constraints[0]);
2676 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2678 error ("too many alternatives in %<asm%>");
2679 return false;
2682 for (unsigned i = 1; i < len; ++i)
2683 if (n_occurrences (',', constraints[i]) != nalternatives)
2685 error ("operand constraints for %<asm%> differ "
2686 "in number of alternatives");
2687 return false;
2690 return true;
2693 /* Check for overlap between registers marked in CLOBBERED_REGS and
2694 anything inappropriate in T. Emit error and return the register
2695 variable definition for error, NULL_TREE for ok. */
2697 static bool
2698 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2700 /* Conflicts between asm-declared register variables and the clobber
2701 list are not allowed. */
2702 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2704 if (overlap)
2706 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2707 DECL_NAME (overlap));
2709 /* Reset registerness to stop multiple errors emitted for a single
2710 variable. */
2711 DECL_REGISTER (overlap) = 0;
2712 return true;
2715 return false;
2718 /* Generate RTL for the GIMPLE asm statement STMT.
2719 A statement for which gimple_asm_input_p holds is handed to
2720 expand_asm_loc. Otherwise the outputs, inputs, clobbers and labels
2721 are read from STMT, validated, and one insn (a jump insn when there
2722 are labels) containing the ASM_OPERANDS is emitted. The function
2723 returns early, without emitting the asm, when validation fails.
2731 Not all kinds of lvalue that may appear as outputs can be stored directly.
2732 For those the asm writes into a temporary, and insns copying the
2733 temporary to the originally specified lvalue are emitted after the asm.
2736 The volatility of the insn is taken from gimple_asm_volatile_p (STMT). */
2738 static void
2739 expand_asm_stmt (gasm *stmt)
/* Scoped guard: sets input_location to WHERE on construction and
   restores the previous value on destruction. */
2741 class save_input_location
2743 location_t old;
2745 public:
2746 explicit save_input_location(location_t where)
2748 old = input_location;
2749 input_location = where;
2752 ~save_input_location()
2754 input_location = old;
2758 location_t locus = gimple_location (stmt);
/* Asm with text only: hand the template string to expand_asm_loc. */
2760 if (gimple_asm_input_p (stmt))
2762 const char *s = gimple_asm_string (stmt);
2763 tree string = build_string (strlen (s), s);
2764 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2765 return;
2768 /* There are some legacy diagnostics in here, and this also avoids a
2769 sixth parameter to targetm.md_asm_adjust. */
2770 save_input_location s_i_l(locus);
2772 unsigned noutputs = gimple_asm_noutputs (stmt);
2773 unsigned ninputs = gimple_asm_ninputs (stmt);
2774 unsigned nlabels = gimple_asm_nlabels (stmt);
2775 unsigned i;
2777 /* ??? Diagnose during gimplification? */
2778 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2780 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2781 return;
2784 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2785 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2786 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2788 /* Copy the gimple vectors into new vectors that we can manipulate.
   CONSTRAINTS holds the output constraints first, then the inputs'. */
2790 output_tvec.safe_grow (noutputs);
2791 input_tvec.safe_grow (ninputs);
2792 constraints.safe_grow (noutputs + ninputs);
2794 for (i = 0; i < noutputs; ++i)
2796 tree t = gimple_asm_output_op (stmt, i);
2797 output_tvec[i] = TREE_VALUE (t);
2798 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2800 for (i = 0; i < ninputs; i++)
2802 tree t = gimple_asm_input_op (stmt, i);
2803 input_tvec[i] = TREE_VALUE (t);
2804 constraints[i + noutputs]
2805 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2808 /* ??? Diagnose during gimplification? */
2809 if (! check_operand_nalternatives (constraints))
2810 return;
2812 /* Count the number of meaningful clobbered registers, ignoring what
2813 we would ignore later. */
2814 auto_vec<rtx> clobber_rvec;
2815 HARD_REG_SET clobbered_regs;
2816 CLEAR_HARD_REG_SET (clobbered_regs);
2818 if (unsigned n = gimple_asm_nclobbers (stmt))
2820 clobber_rvec.reserve (n);
2821 for (i = 0; i < n; i++)
2823 tree t = gimple_asm_clobber_op (stmt, i);
2824 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2825 int nregs, j;
/* A negative J is one of the special codes handled below; otherwise
   J is the first of NREGS consecutive hard register numbers. */
2827 j = decode_reg_name_and_count (regname, &nregs);
2828 if (j < 0)
2830 if (j == -2)
2832 /* ??? Diagnose during gimplification? */
2833 error ("unknown register name %qs in %<asm%>", regname);
2835 else if (j == -4)
/* Recorded as a clobber of a BLKmode MEM at a SCRATCH address. */
2837 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2838 clobber_rvec.safe_push (x);
2840 else
2842 /* Otherwise we should have -1 == empty string
2843 or -3 == cc, which is not a register. */
2844 gcc_assert (j == -1 || j == -3);
2847 else
2848 for (int reg = j; reg < j + nregs; reg++)
2850 /* Clobbering the PIC register is an error. */
2851 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2853 /* ??? Diagnose during gimplification? */
2854 error ("PIC register clobbered by %qs in %<asm%>",
2855 regname);
2856 return;
2859 SET_HARD_REG_BIT (clobbered_regs, reg);
2860 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
2861 clobber_rvec.safe_push (x);
2865 unsigned nclobbers = clobber_rvec.length();
2867 /* First pass over inputs and outputs checks validity and sets
2868 mark_addressable if needed. */
2869 /* ??? Diagnose during gimplification? */
2871 for (i = 0; i < noutputs; ++i)
2873 tree val = output_tvec[i];
2874 tree type = TREE_TYPE (val);
2875 const char *constraint;
2876 bool is_inout;
2877 bool allows_reg;
2878 bool allows_mem;
2880 /* Try to parse the output constraint. If that fails, there's
2881 no point in going further. */
2882 constraint = constraints[i];
2883 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
2884 &allows_mem, &allows_reg, &is_inout))
2885 return;
2887 if (! allows_reg
2888 && (allows_mem
2889 || is_inout
2890 || (DECL_P (val)
2891 && REG_P (DECL_RTL (val))
2892 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
2893 mark_addressable (val);
2896 for (i = 0; i < ninputs; ++i)
2898 bool allows_reg, allows_mem;
2899 const char *constraint;
2901 constraint = constraints[i + noutputs];
2902 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
2903 constraints.address (),
2904 &allows_mem, &allows_reg))
2905 return;
2907 if (! allows_reg && allows_mem)
2908 mark_addressable (input_tvec[i]);
2911 /* Second pass evaluates arguments. */
2913 /* Make sure stack is consistent for asm goto. */
2914 if (nlabels > 0)
2915 do_pending_stack_adjust ();
2916 int old_generating_concat_p = generating_concat_p;
2918 /* Vector of RTX's of evaluated output operands. */
2919 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
2920 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
/* Insns that copy temporaries back to the real output operands are
   accumulated in this sequence and emitted after the asm. */
2921 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
2923 output_rvec.safe_grow (noutputs);
2925 for (i = 0; i < noutputs; ++i)
2927 tree val = output_tvec[i];
2928 tree type = TREE_TYPE (val);
2929 bool is_inout, allows_reg, allows_mem, ok;
2930 rtx op;
/* Note that the parsed constraint is written back into CONSTRAINTS
   here, unlike in the first pass which used a local copy. */
2932 ok = parse_output_constraint (&constraints[i], i, ninputs,
2933 noutputs, &allows_mem, &allows_reg,
2934 &is_inout);
2935 gcc_assert (ok);
2937 /* If an output operand is not a decl or indirect ref and our constraint
2938 allows a register, make a temporary to act as an intermediate.
2939 Make the asm insn write into that, then we will copy it to
2940 the real output operand. Likewise for promoted variables. */
2942 generating_concat_p = 0;
2944 if ((TREE_CODE (val) == INDIRECT_REF
2945 && allows_mem)
2946 || (DECL_P (val)
2947 && (allows_mem || REG_P (DECL_RTL (val)))
2948 && ! (REG_P (DECL_RTL (val))
2949 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
2950 || ! allows_reg
2951 || is_inout)
2953 op = expand_expr (val, NULL_RTX, VOIDmode,
2954 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
2955 if (MEM_P (op))
2956 op = validize_mem (op);
2958 if (! allows_reg && !MEM_P (op))
2959 error ("output number %d not directly addressable", i);
/* The operand is a MEM the constraint does not allow, or a CONCAT:
   let the asm use a fresh pseudo and copy it back afterwards. */
2960 if ((! allows_mem && MEM_P (op))
2961 || GET_CODE (op) == CONCAT)
2963 rtx old_op = op;
2964 op = gen_reg_rtx (GET_MODE (op));
2966 generating_concat_p = old_generating_concat_p;
2968 if (is_inout)
2969 emit_move_insn (op, old_op);
2971 push_to_sequence2 (after_rtl_seq, after_rtl_end);
2972 emit_move_insn (old_op, op);
2973 after_rtl_seq = get_insns ();
2974 after_rtl_end = get_last_insn ();
2975 end_sequence ();
2978 else
2980 op = assign_temp (type, 0, 1);
2981 op = validize_mem (op);
2982 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
2983 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
2985 generating_concat_p = old_generating_concat_p;
2987 push_to_sequence2 (after_rtl_seq, after_rtl_end);
2988 expand_assignment (val, make_tree (type, op), false);
2989 after_rtl_seq = get_insns ();
2990 after_rtl_end = get_last_insn ();
2991 end_sequence ();
2993 output_rvec[i] = op;
2995 if (is_inout)
2996 inout_opnum.safe_push (i);
2999 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3000 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3002 input_rvec.safe_grow (ninputs);
3003 input_mode.safe_grow (ninputs);
3005 generating_concat_p = 0;
3007 for (i = 0; i < ninputs; ++i)
3009 tree val = input_tvec[i];
3010 tree type = TREE_TYPE (val);
3011 bool allows_reg, allows_mem, ok;
3012 const char *constraint;
3013 rtx op;
3015 constraint = constraints[i + noutputs];
3016 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3017 constraints.address (),
3018 &allows_mem, &allows_reg);
3019 gcc_assert (ok);
3021 /* EXPAND_INITIALIZER will not generate code for valid initializer
3022 constants, but will still generate code for other types of operand.
3023 This is the behavior we want for constant constraints. */
3024 op = expand_expr (val, NULL_RTX, VOIDmode,
3025 allows_reg ? EXPAND_NORMAL
3026 : allows_mem ? EXPAND_MEMORY
3027 : EXPAND_INITIALIZER);
3029 /* Never pass a CONCAT to an ASM. */
3030 if (GET_CODE (op) == CONCAT)
3031 op = force_reg (GET_MODE (op), op);
3032 else if (MEM_P (op))
3033 op = validize_mem (op);
3035 if (asm_operand_ok (op, constraint, NULL) <= 0)
3037 if (allows_reg && TYPE_MODE (type) != BLKmode)
3038 op = force_reg (TYPE_MODE (type), op);
3039 else if (!allows_mem)
3040 warning (0, "asm operand %d probably doesn%'t match constraints",
3041 i + noutputs);
3042 else if (MEM_P (op))
3044 /* We won't recognize either volatile memory or memory
3045 with a queued address as a valid memory_operand
3046 at this point. Ignore it: clearly this *is* a memory. */
3048 else
3049 gcc_unreachable ();
3051 input_rvec[i] = op;
3052 input_mode[i] = TYPE_MODE (type);
3055 /* For in-out operands, copy output rtx to input rtx. The extra
   input gets the decimal number of the output operand as its
   constraint string. */
3056 unsigned ninout = inout_opnum.length();
3057 for (i = 0; i < ninout; i++)
3059 int j = inout_opnum[i];
3060 rtx o = output_rvec[j];
3062 input_rvec.safe_push (o);
3063 input_mode.safe_push (GET_MODE (o));
3065 char buffer[16];
3066 sprintf (buffer, "%d", j);
3067 constraints.safe_push (ggc_strdup (buffer));
3069 ninputs += ninout;
3071 /* Sometimes we wish to automatically clobber registers across an asm.
3072 Case in point is when the i386 backend moved from cc0 to a hard reg --
3073 maintaining source-level compatibility means automatically clobbering
3074 the flags register. */
3075 rtx_insn *after_md_seq = NULL;
3076 if (targetm.md_asm_adjust)
3077 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3078 constraints, clobber_rvec,
3079 clobbered_regs);
3081 /* Do not allow the hook to change the output and input count,
3082 lest it mess up the operand numbering. */
3083 gcc_assert (output_rvec.length() == noutputs);
3084 gcc_assert (input_rvec.length() == ninputs);
3085 gcc_assert (constraints.length() == noutputs + ninputs);
3087 /* But it certainly can adjust the clobbers. */
3088 nclobbers = clobber_rvec.length();
3090 /* Third pass checks for easy conflicts. */
3091 /* ??? Why are we doing this on trees instead of rtx. */
3093 bool clobber_conflict_found = 0;
3094 for (i = 0; i < noutputs; ++i)
3095 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3096 clobber_conflict_found = 1;
/* NINPUTS now includes the in-out copies, which have no entry in
   INPUT_TVEC; only the original inputs are checked. */
3097 for (i = 0; i < ninputs - ninout; ++i)
3098 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3099 clobber_conflict_found = 1;
3101 /* Make vectors for the expression-rtx, constraint strings,
3102 and named operands. */
3104 rtvec argvec = rtvec_alloc (ninputs);
3105 rtvec constraintvec = rtvec_alloc (ninputs);
3106 rtvec labelvec = rtvec_alloc (nlabels);
3108 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3109 : GET_MODE (output_rvec[0])),
3110 ggc_strdup (gimple_asm_string (stmt)),
3111 empty_string, 0, argvec, constraintvec,
3112 labelvec, locus);
3113 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3115 for (i = 0; i < ninputs; ++i)
3117 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3118 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3119 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3120 constraints[i + noutputs],
3121 locus);
3124 /* Copy labels to the vector. */
3125 rtx_code_label *fallthru_label = NULL;
3126 if (nlabels > 0)
3128 basic_block fallthru_bb = NULL;
3129 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3130 if (fallthru)
3131 fallthru_bb = fallthru->dest;
3133 for (i = 0; i < nlabels; ++i)
3135 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3136 rtx_insn *r;
3137 /* If asm goto has any labels in the fallthru basic block, use
3138 a label that we emit immediately after the asm goto. Expansion
3139 may insert further instructions into the same basic block after
3140 asm goto and if we don't do this, insertion of instructions on
3141 the fallthru edge might misbehave. See PR58670. */
3142 if (fallthru_bb && label_to_block_fn (cfun, label) == fallthru_bb)
3144 if (fallthru_label == NULL_RTX)
3145 fallthru_label = gen_label_rtx ();
3146 r = fallthru_label;
3148 else
3149 r = label_rtx (label);
3150 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3154 /* Now, for each output, construct an rtx
3155 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3156 ARGVEC CONSTRAINTS OPNAMES))
3157 If there is more than one, put them inside a PARALLEL. */
3159 if (nlabels > 0 && nclobbers == 0)
3161 gcc_assert (noutputs == 0);
3162 emit_jump_insn (body);
3164 else if (noutputs == 0 && nclobbers == 0)
3166 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3167 emit_insn (body);
3169 else if (noutputs == 1 && nclobbers == 0)
3171 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3172 emit_insn (gen_rtx_SET (output_rvec[0], body));
3174 else
3176 rtx obody = body;
3177 int num = noutputs;
3179 if (num == 0)
3180 num = 1;
3182 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3184 /* For each output operand, store a SET. Output 0 reuses OBODY;
   every further output gets its own ASM_OPERANDS that shares the
   template and the argument, constraint and label vectors. */
3185 for (i = 0; i < noutputs; ++i)
3187 rtx src, o = output_rvec[i];
3188 if (i == 0)
3190 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3191 src = obody;
3193 else
3195 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3196 ASM_OPERANDS_TEMPLATE (obody),
3197 constraints[i], i, argvec,
3198 constraintvec, labelvec, locus);
3199 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3201 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3204 /* If there are no outputs (but there are some clobbers)
3205 store the bare ASM_OPERANDS into the PARALLEL. */
3206 if (i == 0)
3207 XVECEXP (body, 0, i++) = obody;
3209 /* Store (clobber REG) for each clobbered register specified. */
3210 for (unsigned j = 0; j < nclobbers; ++j)
3212 rtx clobbered_reg = clobber_rvec[j];
3214 /* Do sanity check for overlap between clobbers and respectively
3215 input and outputs that hasn't been handled. Such overlap
3216 should have been detected and reported above. */
3217 if (!clobber_conflict_found && REG_P (clobbered_reg))
3219 /* We test the operand vectors rather than BODY, which is
3220 still under construction at this point. */
3221 for (unsigned k = 0; k < noutputs; ++k)
3222 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3223 internal_error ("asm clobber conflict with output operand");
3225 for (unsigned k = 0; k < ninputs - ninout; ++k)
3226 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3227 internal_error ("asm clobber conflict with input operand");
3230 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3233 if (nlabels > 0)
3234 emit_jump_insn (body);
3235 else
3236 emit_insn (body);
3239 generating_concat_p = old_generating_concat_p;
/* Everything below is emitted after the asm itself: the fallthru
   label, then the sequence returned by the md_asm_adjust hook, then
   the copies from temporaries to the real output operands. */
3241 if (fallthru_label)
3242 emit_label (fallthru_label);
3244 if (after_md_seq)
3245 emit_insn (after_md_seq);
3246 if (after_rtl_seq)
3247 emit_insn (after_rtl_seq);
3249 free_temp_slots ();
3250 crtl->has_asm_statement = 1;
3253 /* Emit code to jump to the address
3254 specified by the pointer expression EXP. */
3256 static void
3257 expand_computed_goto (tree exp)
3259 rtx x = expand_normal (exp);
3261 do_pending_stack_adjust ();
3262 emit_indirect_jump (x);
3265 /* Generate RTL code for a `goto' statement with target label LABEL.
3266 LABEL should be a LABEL_DECL tree node that was or will later be
3267 defined with `expand_label'. */
3269 static void
3270 expand_goto (tree label)
3272 #ifdef ENABLE_CHECKING
3273 /* Check for a nonlocal goto to a containing function. Should have
3274 gotten translated to __builtin_nonlocal_goto. */
3275 tree context = decl_function_context (label);
3276 gcc_assert (!context || context == current_function_decl);
3277 #endif
3279 emit_jump (jump_target_rtx (label));
3282 /* Output a return with no value. */
3284 static void
3285 expand_null_return_1 (void)
3287 clear_pending_stack_adjust ();
3288 do_pending_stack_adjust ();
3289 emit_jump (return_label);
3292 /* Generate RTL to return from the current function, with no value.
3293 (That is, we do not do anything about returning any value.) */
3295 void
3296 expand_null_return (void)
3298 /* If this function was declared to return a value, but we
3299 didn't, clobber the return registers so that they are not
3300 propagated live to the rest of the function. */
3301 clobber_return_register ();
3303 expand_null_return_1 ();
3306 /* Generate RTL to return from the current function, with value VAL. */
3308 static void
3309 expand_value_return (rtx val)
3311 /* Copy the value to the return location unless it's already there. */
3313 tree decl = DECL_RESULT (current_function_decl);
3314 rtx return_reg = DECL_RTL (decl);
3315 if (return_reg != val)
3317 tree funtype = TREE_TYPE (current_function_decl);
3318 tree type = TREE_TYPE (decl);
3319 int unsignedp = TYPE_UNSIGNED (type);
3320 machine_mode old_mode = DECL_MODE (decl);
3321 machine_mode mode;
3322 if (DECL_BY_REFERENCE (decl))
3323 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3324 else
3325 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3327 if (mode != old_mode)
3328 val = convert_modes (mode, old_mode, val, unsignedp);
3330 if (GET_CODE (return_reg) == PARALLEL)
3331 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3332 else
3333 emit_move_insn (return_reg, val);
3336 expand_null_return_1 ();
3339 /* Generate RTL to evaluate the expression RETVAL and return it
3340 from the current function. */
/* RETVAL may be error_mark_node, a MODIFY_EXPR or INIT_EXPR whose first
   operand is a RESULT_DECL (its second operand is then the value being
   returned), or the returned expression itself.  BOUNDS is the bounds
   expression that goes with the value; it may be null or
   error_mark_node and is only looked at when the function's
   RESULT_DECL has a DECL_BOUNDS_RTL.  */
3342 static void
3343 expand_return (tree retval, tree bounds)
3345 rtx result_rtl;
3346 rtx val = 0;
3347 tree retval_rhs;
3348 rtx bounds_rtl;
3350 /* If function wants no value, give it none. */
/* RETVAL is still expanded, but the resulting rtx is discarded.  */
3351 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3353 expand_normal (retval);
3354 expand_null_return ();
3355 return;
3358 if (retval == error_mark_node)
3360 /* Treat this like a return of no value from a function that
3361 returns a value. */
3362 expand_null_return ();
3363 return;
/* Pick out the value actually being returned: the right-hand side of
   an assignment to the RESULT_DECL, or RETVAL itself.  */
3365 else if ((TREE_CODE (retval) == MODIFY_EXPR
3366 || TREE_CODE (retval) == INIT_EXPR)
3367 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3368 retval_rhs = TREE_OPERAND (retval, 1);
3369 else
3370 retval_rhs = retval;
3372 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3374 /* Put returned bounds to the right place. */
3375 bounds_rtl = DECL_BOUNDS_RTL (DECL_RESULT (current_function_decl));
3376 if (bounds_rtl)
3378 rtx addr = NULL;
3379 rtx bnd = NULL;
/* A usable BOUNDS expression is expanded and stored directly.  */
3381 if (bounds && bounds != error_mark_node)
3383 bnd = expand_normal (bounds);
3384 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
/* Otherwise BOUNDS is either error_mark_node, in which case zero bounds
   are used, or null, in which case the bounds are loaded through a MEM
   built from the address of RETVAL_RHS.  */
3386 else if (REG_P (bounds_rtl))
3388 if (bounds)
3389 bnd = chkp_expand_zero_bounds ();
3390 else
3392 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3393 addr = gen_rtx_MEM (Pmode, addr);
3394 bnd = targetm.calls.load_bounds_for_arg (addr, NULL, NULL);
3397 targetm.calls.store_returned_bounds (bounds_rtl, bnd);
3399 else
3401 int n;
/* The only other supported shape is a PARALLEL; each of its elements
   supplies a slot (operand 0) and an offset (operand 1).  */
3403 gcc_assert (GET_CODE (bounds_rtl) == PARALLEL);
3405 if (bounds)
3406 bnd = chkp_expand_zero_bounds ();
3407 else
3409 addr = expand_normal (build_fold_addr_expr (retval_rhs));
3410 addr = gen_rtx_MEM (Pmode, addr);
3413 for (n = 0; n < XVECLEN (bounds_rtl, 0); n++)
3415 rtx slot = XEXP (XVECEXP (bounds_rtl, 0, n), 0);
3416 if (!bounds)
3418 rtx offs = XEXP (XVECEXP (bounds_rtl, 0, n), 1);
3419 rtx from = adjust_address (addr, Pmode, INTVAL (offs));
3420 bnd = targetm.calls.load_bounds_for_arg (from, NULL, NULL);
3422 targetm.calls.store_returned_bounds (slot, bnd);
/* No bounds rtx: in an instrumented function, a value that is not
   BOUNDED_P, whose type has pointers and that is not the RESULT_DECL
   gets its bounds copied to RESULT_RTL, which must then be a MEM.  */
3426 else if (chkp_function_instrumented_p (current_function_decl)
3427 && !BOUNDED_P (retval_rhs)
3428 && chkp_type_has_pointer (TREE_TYPE (retval_rhs))
3429 && TREE_CODE (retval_rhs) != RESULT_DECL)
3431 rtx addr = expand_normal (build_fold_addr_expr (retval_rhs));
3432 addr = gen_rtx_MEM (Pmode, addr);
3434 gcc_assert (MEM_P (result_rtl));
3436 chkp_copy_bounds_for_stack_parm (result_rtl, addr, TREE_TYPE (retval_rhs));
3439 /* If we are returning the RESULT_DECL, then the value has already
3440 been stored into it, so we don't have to do anything special. */
3441 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3442 expand_value_return (result_rtl);
3444 /* If the result is an aggregate that is being returned in one (or more)
3445 registers, load the registers here. */
3447 else if (retval_rhs != 0
3448 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3449 && REG_P (result_rtl))
3451 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3452 if (val)
3454 /* Use the mode of the result value on the return register. */
3455 PUT_MODE (result_rtl, GET_MODE (val));
3456 expand_value_return (val);
3458 else
3459 expand_null_return ();
/* A non-void value returned in a REG or a PARALLEL is first computed
   into a temporary, forced out of memory, and then returned.  */
3461 else if (retval_rhs != 0
3462 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3463 && (REG_P (result_rtl)
3464 || (GET_CODE (result_rtl) == PARALLEL)))
3466 /* Compute the return value into a temporary (usually a pseudo reg). */
3468 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3469 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3470 val = force_not_mem (val);
3471 expand_value_return (val);
3473 else
3475 /* No hard reg used; calculate value into hard return reg. */
/* RETVAL as a whole is expanded with const0_rtx as target, and
   RESULT_RTL is then returned.  */
3476 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3477 expand_value_return (result_rtl);
3481 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3482 STMT that doesn't require special handling for outgoing edges. That
3483 is no tailcalls and no GIMPLE_COND. */
/* The statement codes handled are GIMPLE_GOTO, GIMPLE_LABEL, GIMPLE_NOP,
   GIMPLE_PREDICT, GIMPLE_SWITCH, GIMPLE_ASM, GIMPLE_CALL, GIMPLE_RETURN
   and GIMPLE_ASSIGN; any other code reaches gcc_unreachable.  The
   current insn location is set from STMT before anything is expanded.  */
3485 static void
3486 expand_gimple_stmt_1 (gimple *stmt)
3488 tree op0;
3490 set_curr_insn_location (gimple_location (stmt));
3492 switch (gimple_code (stmt))
3494 case GIMPLE_GOTO:
/* A LABEL_DECL destination is a plain goto; any other destination is
   expanded as a computed goto.  */
3495 op0 = gimple_goto_dest (stmt);
3496 if (TREE_CODE (op0) == LABEL_DECL)
3497 expand_goto (op0);
3498 else
3499 expand_computed_goto (op0);
3500 break;
3501 case GIMPLE_LABEL:
3502 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3503 break;
/* GIMPLE_NOP and GIMPLE_PREDICT expand to nothing.  */
3504 case GIMPLE_NOP:
3505 case GIMPLE_PREDICT:
3506 break;
3507 case GIMPLE_SWITCH:
3508 expand_case (as_a <gswitch *> (stmt));
3509 break;
3510 case GIMPLE_ASM:
3511 expand_asm_stmt (as_a <gasm *> (stmt));
3512 break;
3513 case GIMPLE_CALL:
3514 expand_call_stmt (as_a <gcall *> (stmt));
3515 break;
3517 case GIMPLE_RETURN:
/* OP0 is the returned value and BND the bounds returned with it;
   either may be null.  */
3519 tree bnd = gimple_return_retbnd (as_a <greturn *> (stmt));
3520 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3522 if (op0 && op0 != error_mark_node)
3524 tree result = DECL_RESULT (current_function_decl);
3526 /* If we are not returning the current function's RESULT_DECL,
3527 build an assignment to it. */
3528 if (op0 != result)
3530 /* I believe that a function's RESULT_DECL is unique. */
3531 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3533 /* ??? We'd like to use simply expand_assignment here,
3534 but this fails if the value is of BLKmode but the return
3535 decl is a register. expand_return has special handling
3536 for this combination, which eventually should move
3537 to common code. See comments there. Until then, let's
3538 build a modify expression :-/ */
3539 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3540 result, op0);
3542 /* Mark we have return statement with missing bounds. */
3543 if (!bnd && chkp_function_instrumented_p (cfun->decl))
3544 bnd = error_mark_node;
/* A return without a value is a null return; otherwise the value and
   its bounds are handed to expand_return.  */
3547 if (!op0)
3548 expand_null_return ();
3549 else
3550 expand_return (op0, bnd);
3552 break;
3554 case GIMPLE_ASSIGN:
3556 gassign *assign_stmt = as_a <gassign *> (stmt);
3557 tree lhs = gimple_assign_lhs (assign_stmt);
3559 /* Tree expand used to fiddle with |= and &= of two bitfield
3560 COMPONENT_REFs here. This can't happen with gimple, the LHS
3561 of binary assigns must be a gimple reg. */
/* An LHS that is not an SSA_NAME, or a single-operand RHS, goes through
   expand_assignment; unary, binary and ternary right-hand sides
   assigned to an SSA_NAME take the other branch.  */
3563 if (TREE_CODE (lhs) != SSA_NAME
3564 || get_gimple_rhs_class (gimple_expr_code (stmt))
3565 == GIMPLE_SINGLE_RHS)
3567 tree rhs = gimple_assign_rhs1 (assign_stmt);
3568 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3569 == GIMPLE_SINGLE_RHS);
3570 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3571 /* Do not put locations on possibly shared trees. */
3572 && !is_gimple_min_invariant (rhs))
3573 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3574 if (TREE_CLOBBER_P (rhs))
3575 /* This is a clobber to mark the going out of scope for
3576 this LHS. */
3578 else
3579 expand_assignment (lhs, rhs,
3580 gimple_assign_nontemporal_move_p (
3581 assign_stmt));
3583 else
3585 rtx target, temp;
3586 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3587 struct separate_ops ops;
3588 bool promoted = false;
/* TARGET is the rtx of the LHS, expanded for writing.  PROMOTED records
   that it is a SUBREG with SUBREG_PROMOTED_VAR_P set.  */
3590 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3591 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3592 promoted = true;
/* Gather the operation code, type, operands and location into OPS.  The
   cases fall through on purpose, so a ternary RHS fills op2, op1 and
   op0, a binary RHS op1 and op0, and a unary RHS only op0.  */
3594 ops.code = gimple_assign_rhs_code (assign_stmt);
3595 ops.type = TREE_TYPE (lhs);
3596 switch (get_gimple_rhs_class (ops.code))
3598 case GIMPLE_TERNARY_RHS:
3599 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3600 /* Fallthru */
3601 case GIMPLE_BINARY_RHS:
3602 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3603 /* Fallthru */
3604 case GIMPLE_UNARY_RHS:
3605 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3606 break;
3607 default:
3608 gcc_unreachable ();
3610 ops.location = gimple_location (stmt);
3612 /* If we want to use a nontemporal store, force the value to
3613 register first. If we store into a promoted register,
3614 don't directly expand to target. */
3615 temp = nontemporal || promoted ? NULL_RTX : target;
3616 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3617 EXPAND_NORMAL);
/* Store TEMP into TARGET.  The branches below, in order: the value is
   already in TARGET; TARGET is a promoted SUBREG, so the value is
   converted and moved into SUBREG_REG (TARGET); a nontemporal store
   insn was emitted; otherwise an ordinary move, skipped when
   force_operand already produced TARGET.  */
3619 if (temp == target)
3621 else if (promoted)
3623 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3624 /* If TEMP is a VOIDmode constant, use convert_modes to make
3625 sure that we properly convert it. */
3626 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3628 temp = convert_modes (GET_MODE (target),
3629 TYPE_MODE (ops.type),
3630 temp, unsignedp);
3631 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3632 GET_MODE (target), temp, unsignedp);
3635 convert_move (SUBREG_REG (target), temp, unsignedp);
3637 else if (nontemporal && emit_storent_insn (target, temp))
3639 else
3641 temp = force_operand (temp, target);
3642 if (temp != target)
3643 emit_move_insn (target, temp);
3647 break;
3649 default:
3650 gcc_unreachable ();
3654 /* Expand one gimple statement STMT and return the last RTL instruction
3655 before any of the newly generated ones.
3657 In addition to generating the necessary RTL instructions this also
3658 sets REG_EH_REGION notes if necessary and sets the current source
3659 location for diagnostics. */
3661 static rtx_insn *
3662 expand_gimple_stmt (gimple *stmt)
3664 location_t saved_location = input_location;
3665 rtx_insn *last = get_last_insn ();
3666 int lp_nr;
3668 gcc_assert (cfun);
3670 /* We need to save and restore the current source location so that errors
3671 discovered during expansion are emitted with the right location. But
3672 it would be better if the diagnostic routines used the source location
3673 embedded in the tree nodes rather than globals. */
3674 if (gimple_has_location (stmt))
3675 input_location = gimple_location (stmt);
3677 expand_gimple_stmt_1 (stmt);
3679 /* Free any temporaries used to evaluate this statement. */
3680 free_temp_slots ();
3682 input_location = saved_location;
3684 /* Mark all insns that may trap. */
3685 lp_nr = lookup_stmt_eh_lp (stmt);
3686 if (lp_nr)
3688 rtx_insn *insn;
3689 for (insn = next_real_insn (last); insn;
3690 insn = next_real_insn (insn))
3692 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3693 /* If we want exceptions for non-call insns, any
3694 may_trap_p instruction may throw. */
3695 && GET_CODE (PATTERN (insn)) != CLOBBER
3696 && GET_CODE (PATTERN (insn)) != USE
3697 && insn_could_throw_p (insn))
3698 make_reg_eh_region_note (insn, 0, lp_nr);
3702 return last;
3705 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3706 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3707 generated a tail call (something that might be denied by the ABI
3708 rules governing the call; see calls.c).
3710 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3711 can still reach the rest of BB. The case here is __builtin_sqrt,
3712 where the NaN result goes through the external function (with a
3713 tailcall) and the normal result happens via a sqrt instruction. */
/* When no sibling call insn was emitted, *CAN_FALLTHRU is set to true
   and NULL is returned.  Otherwise the value returned is BB itself, or
   the new basic block created for the insns left after the sibcall's
   barrier.  */
3715 static basic_block
3716 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3718 rtx_insn *last2, *last;
3719 edge e;
3720 edge_iterator ei;
3721 int probability;
3722 gcov_type count;
/* LAST2 keeps the insn that preceded the expansion, for the dump calls
   below; LAST walks the newly emitted insns looking for a sibling
   call.  */
3724 last2 = last = expand_gimple_stmt (stmt);
3726 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3727 if (CALL_P (last) && SIBLING_CALL_P (last))
3728 goto found;
3730 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3732 *can_fallthru = true;
3733 return NULL;
3735 found:
3736 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3737 Any instructions emitted here are about to be deleted. */
3738 do_pending_stack_adjust ();
3740 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3741 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3742 EH or abnormal edges, we shouldn't have created a tail call in
3743 the first place. So it seems to me we should just be removing
3744 all edges here, or redirecting the existing fallthru edge to
3745 the exit block. */
/* PROBABILITY and COUNT accumulate the totals of the removed edges;
   they are added to the new sibcall edge created further down.  */
3747 probability = 0;
3748 count = 0;
/* The iterator is advanced only when the current edge is kept.  */
3750 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3752 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3754 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
/* Take this edge's count and frequency out of its destination block,
   clamping both at zero.  */
3756 e->dest->count -= e->count;
3757 e->dest->frequency -= EDGE_FREQUENCY (e);
3758 if (e->dest->count < 0)
3759 e->dest->count = 0;
3760 if (e->dest->frequency < 0)
3761 e->dest->frequency = 0;
3763 count += e->count;
3764 probability += e->probability;
3765 remove_edge (e);
3767 else
3768 ei_next (&ei);
3771 /* This is somewhat ugly: the call_expr expander often emits instructions
3772 after the sibcall (to perform the function return). These confuse the
3773 find_many_sub_basic_blocks code, so we need to get rid of these. */
/* The insn right after the sibling call must be a barrier.  */
3774 last = NEXT_INSN (last);
3775 gcc_assert (BARRIER_P (last));
3777 *can_fallthru = false;
3778 while (NEXT_INSN (last))
3780 /* For instance an sqrt builtin expander expands if with
3781 sibcall in the then and label for `else`. */
3782 if (LABEL_P (NEXT_INSN (last)))
3784 *can_fallthru = true;
3785 break;
3787 delete_insn (NEXT_INSN (last));
/* BB now ends at the barrier and gets an abnormal sibcall edge to the
   exit block.  */
3790 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3791 | EDGE_SIBCALL);
3792 e->probability += probability;
3793 e->count += count;
3794 BB_END (bb) = last;
3795 update_bb_for_insn (bb);
/* Insns that survive after the barrier are put into a new basic block
   placed after BB; if that block would end in a barrier, its end is
   moved back by one insn.  */
3797 if (NEXT_INSN (last))
3799 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3801 last = BB_END (bb);
3802 if (BARRIER_P (last))
3803 BB_END (bb) = PREV_INSN (last);
3806 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3808 return bb;
3811 /* Return the difference between the floor and the truncated result of
3812 a signed division by OP1 with remainder MOD. */
3813 static rtx
3814 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3816 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3817 return gen_rtx_IF_THEN_ELSE
3818 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3819 gen_rtx_IF_THEN_ELSE
3820 (mode, gen_rtx_LT (BImode,
3821 gen_rtx_DIV (mode, op1, mod),
3822 const0_rtx),
3823 constm1_rtx, const0_rtx),
3824 const0_rtx);
3827 /* Return the difference between the ceil and the truncated result of
3828 a signed division by OP1 with remainder MOD. */
3829 static rtx
3830 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3832 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3833 return gen_rtx_IF_THEN_ELSE
3834 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3835 gen_rtx_IF_THEN_ELSE
3836 (mode, gen_rtx_GT (BImode,
3837 gen_rtx_DIV (mode, op1, mod),
3838 const0_rtx),
3839 const1_rtx, const0_rtx),
3840 const0_rtx);
3843 /* Return the difference between the ceil and the truncated result of
3844 an unsigned division by OP1 with remainder MOD. */
3845 static rtx
3846 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3848 /* (mod != 0 ? 1 : 0) */
3849 return gen_rtx_IF_THEN_ELSE
3850 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3851 const1_rtx, const0_rtx);
3854 /* Return the difference between the rounded and the truncated result
3855 of a signed division by OP1 with remainder MOD. Halfway cases are
3856 rounded away from zero, rather than to the nearest even number. */
3857 static rtx
3858 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
3860 /* (abs (mod) >= abs (op1) - abs (mod)
3861 ? (op1 / mod > 0 ? 1 : -1)
3862 : 0) */
3863 return gen_rtx_IF_THEN_ELSE
3864 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3865 gen_rtx_MINUS (mode,
3866 gen_rtx_ABS (mode, op1),
3867 gen_rtx_ABS (mode, mod))),
3868 gen_rtx_IF_THEN_ELSE
3869 (mode, gen_rtx_GT (BImode,
3870 gen_rtx_DIV (mode, op1, mod),
3871 const0_rtx),
3872 const1_rtx, constm1_rtx),
3873 const0_rtx);
3876 /* Return the difference between the rounded and the truncated result
3877 of a unsigned division by OP1 with remainder MOD. Halfway cases
3878 are rounded away from zero, rather than to the nearest even
3879 number. */
3880 static rtx
3881 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
3883 /* (mod >= op1 - mod ? 1 : 0) */
3884 return gen_rtx_IF_THEN_ELSE
3885 (mode, gen_rtx_GE (BImode, mod,
3886 gen_rtx_MINUS (mode, op1, mod)),
3887 const1_rtx, const0_rtx);
3890 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3891 any rtl. */
/* AS is the address space the address belongs to.  The result is X
   itself, a new rtx expressing the conversion, or NULL when the
   conversion cannot be represented (see the switch below).  */
3893 static rtx
3894 convert_debug_memory_address (machine_mode mode, rtx x,
3895 addr_space_t as)
3897 machine_mode xmode = GET_MODE (x);
/* Without POINTERS_EXTEND_UNSIGNED nothing is converted: the modes are
   only checked and X is returned unchanged at the end.  */
3899 #ifndef POINTERS_EXTEND_UNSIGNED
3900 gcc_assert (mode == Pmode
3901 || mode == targetm.addr_space.address_mode (as));
3902 gcc_assert (xmode == mode || xmode == VOIDmode);
3903 #else
3904 rtx temp;
3906 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
/* X already in MODE, or a VOIDmode X, is returned as is.  */
3908 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3909 return x;
/* Narrowing takes the low part.  Widening is a ZERO_EXTEND when
   POINTERS_EXTEND_UNSIGNED is positive and a SIGN_EXTEND when it is
   zero; the remaining (negative) value is handled per rtx code.  */
3911 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3912 x = lowpart_subreg (mode, x, xmode);
3913 else if (POINTERS_EXTEND_UNSIGNED > 0)
3914 x = gen_rtx_ZERO_EXTEND (mode, x);
3915 else if (!POINTERS_EXTEND_UNSIGNED)
3916 x = gen_rtx_SIGN_EXTEND (mode, x);
3917 else
3919 switch (GET_CODE (x))
3921 case SUBREG:
/* A SUBREG whose inner rtx already has MODE is replaced by that inner
   rtx, provided the SUBREG is a promoted variable or the inner rtx is
   a pointer register, possibly plus a constant integer.  */
3922 if ((SUBREG_PROMOTED_VAR_P (x)
3923 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3924 || (GET_CODE (SUBREG_REG (x)) == PLUS
3925 && REG_P (XEXP (SUBREG_REG (x), 0))
3926 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
3927 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
3928 && GET_MODE (SUBREG_REG (x)) == mode)
3929 return SUBREG_REG (x);
3930 break;
3931 case LABEL_REF:
/* A new LABEL_REF in MODE is built for the same label, carrying over
   the nonlocal flag.  */
3932 temp = gen_rtx_LABEL_REF (mode, LABEL_REF_LABEL (x));
3933 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
3934 return temp;
3935 case SYMBOL_REF:
/* The symbol is copied so that the mode change does not touch X.  */
3936 temp = shallow_copy_rtx (x);
3937 PUT_MODE (temp, mode);
3938 return temp;
3939 case CONST:
/* The operand is converted recursively and wrapped again; a NULL from
   the recursion is passed on.  */
3940 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3941 if (temp)
3942 temp = gen_rtx_CONST (mode, temp);
3943 return temp;
3944 case PLUS:
3945 case MINUS:
/* With a constant integer second operand only the first operand is
   converted, and the same operation is rebuilt in MODE.  */
3946 if (CONST_INT_P (XEXP (x, 1)))
3948 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3949 if (temp)
3950 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
3952 break;
3953 default:
3954 break;
3956 /* Don't know how to express ptr_extend as operation in debug info. */
3957 return NULL;
3959 #endif /* POINTERS_EXTEND_UNSIGNED */
3961 return x;
3964 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
3965 by avoid_deep_ter_for_debug. */
/* The pointer has no initializer here; avoid_deep_ter_for_debug
   allocates the map the first time it has an entry to add.  */
3967 static hash_map<tree, tree> *deep_ter_debug_map;
3969 /* Split too deep TER chains for debug stmts using debug temporaries. */
3971 static void
3972 avoid_deep_ter_for_debug (gimple *stmt, int depth)
3974 use_operand_p use_p;
3975 ssa_op_iter iter;
3976 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
3978 tree use = USE_FROM_PTR (use_p);
3979 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
3980 continue;
3981 gimple *g = get_gimple_for_ssa_name (use);
3982 if (g == NULL)
3983 continue;
3984 if (depth > 6 && !stmt_ends_bb_p (g))
3986 if (deep_ter_debug_map == NULL)
3987 deep_ter_debug_map = new hash_map<tree, tree>;
3989 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
3990 if (vexpr != NULL)
3991 continue;
3992 vexpr = make_node (DEBUG_EXPR_DECL);
3993 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
3994 DECL_ARTIFICIAL (vexpr) = 1;
3995 TREE_TYPE (vexpr) = TREE_TYPE (use);
3996 DECL_MODE (vexpr) = TYPE_MODE (TREE_TYPE (use));
3997 gimple_stmt_iterator gsi = gsi_for_stmt (g);
3998 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
3999 avoid_deep_ter_for_debug (def_temp, 0);
4001 else
4002 avoid_deep_ter_for_debug (g, depth + 1);
4006 /* Return an RTX equivalent to the value of the parameter DECL. */
4008 static rtx
4009 expand_debug_parm_decl (tree decl)
4011 rtx incoming = DECL_INCOMING_RTL (decl);
4013 if (incoming
4014 && GET_MODE (incoming) != BLKmode
4015 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4016 || (MEM_P (incoming)
4017 && REG_P (XEXP (incoming, 0))
4018 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4020 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4022 #ifdef HAVE_window_save
4023 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4024 If the target machine has an explicit window save instruction, the
4025 actual entry value is the corresponding OUTGOING_REGNO instead. */
4026 if (REG_P (incoming)
4027 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4028 incoming
4029 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4030 OUTGOING_REGNO (REGNO (incoming)), 0);
4031 else if (MEM_P (incoming))
4033 rtx reg = XEXP (incoming, 0);
4034 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4036 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4037 incoming = replace_equiv_address_nv (incoming, reg);
4039 else
4040 incoming = copy_rtx (incoming);
4042 #endif
4044 ENTRY_VALUE_EXP (rtl) = incoming;
4045 return rtl;
4048 if (incoming
4049 && GET_MODE (incoming) != BLKmode
4050 && !TREE_ADDRESSABLE (decl)
4051 && MEM_P (incoming)
4052 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4053 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4054 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4055 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4056 return copy_rtx (incoming);
4058 return NULL_RTX;
4061 /* Return an RTX equivalent to the value of the tree expression EXP. */
4063 static rtx
4064 expand_debug_expr (tree exp)
4066 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4067 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4068 machine_mode inner_mode = VOIDmode;
4069 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4070 addr_space_t as;
4072 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4074 case tcc_expression:
4075 switch (TREE_CODE (exp))
4077 case COND_EXPR:
4078 case DOT_PROD_EXPR:
4079 case SAD_EXPR:
4080 case WIDEN_MULT_PLUS_EXPR:
4081 case WIDEN_MULT_MINUS_EXPR:
4082 case FMA_EXPR:
4083 goto ternary;
4085 case TRUTH_ANDIF_EXPR:
4086 case TRUTH_ORIF_EXPR:
4087 case TRUTH_AND_EXPR:
4088 case TRUTH_OR_EXPR:
4089 case TRUTH_XOR_EXPR:
4090 goto binary;
4092 case TRUTH_NOT_EXPR:
4093 goto unary;
4095 default:
4096 break;
4098 break;
4100 ternary:
4101 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4102 if (!op2)
4103 return NULL_RTX;
4104 /* Fall through. */
4106 binary:
4107 case tcc_binary:
4108 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4109 if (!op1)
4110 return NULL_RTX;
4111 switch (TREE_CODE (exp))
4113 case LSHIFT_EXPR:
4114 case RSHIFT_EXPR:
4115 case LROTATE_EXPR:
4116 case RROTATE_EXPR:
4117 case WIDEN_LSHIFT_EXPR:
4118 /* Ensure second operand isn't wider than the first one. */
4119 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4120 if (SCALAR_INT_MODE_P (inner_mode))
4122 machine_mode opmode = mode;
4123 if (VECTOR_MODE_P (mode))
4124 opmode = GET_MODE_INNER (mode);
4125 if (SCALAR_INT_MODE_P (opmode)
4126 && (GET_MODE_PRECISION (opmode)
4127 < GET_MODE_PRECISION (inner_mode)))
4128 op1 = lowpart_subreg (opmode, op1, inner_mode);
4130 break;
4131 default:
4132 break;
4134 /* Fall through. */
4136 unary:
4137 case tcc_unary:
4138 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4139 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4140 if (!op0)
4141 return NULL_RTX;
4142 break;
4144 case tcc_comparison:
4145 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4146 goto binary;
4148 case tcc_type:
4149 case tcc_statement:
4150 gcc_unreachable ();
4152 case tcc_constant:
4153 case tcc_exceptional:
4154 case tcc_declaration:
4155 case tcc_reference:
4156 case tcc_vl_exp:
4157 break;
4160 switch (TREE_CODE (exp))
4162 case STRING_CST:
4163 if (!lookup_constant_def (exp))
4165 if (strlen (TREE_STRING_POINTER (exp)) + 1
4166 != (size_t) TREE_STRING_LENGTH (exp))
4167 return NULL_RTX;
4168 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4169 op0 = gen_rtx_MEM (BLKmode, op0);
4170 set_mem_attributes (op0, exp, 0);
4171 return op0;
4173 /* Fall through... */
4175 case INTEGER_CST:
4176 case REAL_CST:
4177 case FIXED_CST:
4178 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4179 return op0;
4181 case COMPLEX_CST:
4182 gcc_assert (COMPLEX_MODE_P (mode));
4183 op0 = expand_debug_expr (TREE_REALPART (exp));
4184 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4185 return gen_rtx_CONCAT (mode, op0, op1);
4187 case DEBUG_EXPR_DECL:
4188 op0 = DECL_RTL_IF_SET (exp);
4190 if (op0)
4191 return op0;
4193 op0 = gen_rtx_DEBUG_EXPR (mode);
4194 DEBUG_EXPR_TREE_DECL (op0) = exp;
4195 SET_DECL_RTL (exp, op0);
4197 return op0;
4199 case VAR_DECL:
4200 case PARM_DECL:
4201 case FUNCTION_DECL:
4202 case LABEL_DECL:
4203 case CONST_DECL:
4204 case RESULT_DECL:
4205 op0 = DECL_RTL_IF_SET (exp);
4207 /* This decl was probably optimized away. */
4208 if (!op0)
4210 if (TREE_CODE (exp) != VAR_DECL
4211 || DECL_EXTERNAL (exp)
4212 || !TREE_STATIC (exp)
4213 || !DECL_NAME (exp)
4214 || DECL_HARD_REGISTER (exp)
4215 || DECL_IN_CONSTANT_POOL (exp)
4216 || mode == VOIDmode)
4217 return NULL;
4219 op0 = make_decl_rtl_for_debug (exp);
4220 if (!MEM_P (op0)
4221 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4222 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4223 return NULL;
4225 else
4226 op0 = copy_rtx (op0);
4228 if (GET_MODE (op0) == BLKmode
4229 /* If op0 is not BLKmode, but mode is, adjust_mode
4230 below would ICE. While it is likely a FE bug,
4231 try to be robust here. See PR43166. */
4232 || mode == BLKmode
4233 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4235 gcc_assert (MEM_P (op0));
4236 op0 = adjust_address_nv (op0, mode, 0);
4237 return op0;
4240 /* Fall through. */
4242 adjust_mode:
4243 case PAREN_EXPR:
4244 CASE_CONVERT:
4246 inner_mode = GET_MODE (op0);
4248 if (mode == inner_mode)
4249 return op0;
4251 if (inner_mode == VOIDmode)
4253 if (TREE_CODE (exp) == SSA_NAME)
4254 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4255 else
4256 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4257 if (mode == inner_mode)
4258 return op0;
4261 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4263 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
4264 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4265 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
4266 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4267 else
4268 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4270 else if (FLOAT_MODE_P (mode))
4272 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4273 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4274 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4275 else
4276 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4278 else if (FLOAT_MODE_P (inner_mode))
4280 if (unsignedp)
4281 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4282 else
4283 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4285 else if (CONSTANT_P (op0)
4286 || GET_MODE_PRECISION (mode) <= GET_MODE_PRECISION (inner_mode))
4287 op0 = lowpart_subreg (mode, op0, inner_mode);
4288 else if (UNARY_CLASS_P (exp)
4289 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4290 : unsignedp)
4291 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4292 else
4293 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4295 return op0;
4298 case MEM_REF:
4299 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4301 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4302 TREE_OPERAND (exp, 0),
4303 TREE_OPERAND (exp, 1));
4304 if (newexp)
4305 return expand_debug_expr (newexp);
4307 /* FALLTHROUGH */
4308 case INDIRECT_REF:
4309 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4310 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4311 if (!op0)
4312 return NULL;
4314 if (TREE_CODE (exp) == MEM_REF)
4316 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4317 || (GET_CODE (op0) == PLUS
4318 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4319 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4320 Instead just use get_inner_reference. */
4321 goto component_ref;
4323 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4324 if (!op1 || !CONST_INT_P (op1))
4325 return NULL;
4327 op0 = plus_constant (inner_mode, op0, INTVAL (op1));
4330 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4332 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4333 op0, as);
4334 if (op0 == NULL_RTX)
4335 return NULL;
4337 op0 = gen_rtx_MEM (mode, op0);
4338 set_mem_attributes (op0, exp, 0);
4339 if (TREE_CODE (exp) == MEM_REF
4340 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4341 set_mem_expr (op0, NULL_TREE);
4342 set_mem_addr_space (op0, as);
4344 return op0;
4346 case TARGET_MEM_REF:
4347 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4348 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4349 return NULL;
4351 op0 = expand_debug_expr
4352 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4353 if (!op0)
4354 return NULL;
4356 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4357 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4358 op0, as);
4359 if (op0 == NULL_RTX)
4360 return NULL;
4362 op0 = gen_rtx_MEM (mode, op0);
4364 set_mem_attributes (op0, exp, 0);
4365 set_mem_addr_space (op0, as);
4367 return op0;
4369 component_ref:
4370 case ARRAY_REF:
4371 case ARRAY_RANGE_REF:
4372 case COMPONENT_REF:
4373 case BIT_FIELD_REF:
4374 case REALPART_EXPR:
4375 case IMAGPART_EXPR:
4376 case VIEW_CONVERT_EXPR:
4378 machine_mode mode1;
4379 HOST_WIDE_INT bitsize, bitpos;
4380 tree offset;
4381 int volatilep = 0;
4382 tree tem = get_inner_reference (exp, &bitsize, &bitpos, &offset,
4383 &mode1, &unsignedp, &volatilep, false);
4384 rtx orig_op0;
4386 if (bitsize == 0)
4387 return NULL;
4389 orig_op0 = op0 = expand_debug_expr (tem);
4391 if (!op0)
4392 return NULL;
4394 if (offset)
4396 machine_mode addrmode, offmode;
4398 if (!MEM_P (op0))
4399 return NULL;
4401 op0 = XEXP (op0, 0);
4402 addrmode = GET_MODE (op0);
4403 if (addrmode == VOIDmode)
4404 addrmode = Pmode;
4406 op1 = expand_debug_expr (offset);
4407 if (!op1)
4408 return NULL;
4410 offmode = GET_MODE (op1);
4411 if (offmode == VOIDmode)
4412 offmode = TYPE_MODE (TREE_TYPE (offset));
4414 if (addrmode != offmode)
4415 op1 = lowpart_subreg (addrmode, op1, offmode);
4417 /* Don't use offset_address here, we don't need a
4418 recognizable address, and we don't want to generate
4419 code. */
4420 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4421 op0, op1));
4424 if (MEM_P (op0))
4426 if (mode1 == VOIDmode)
4427 /* Bitfield. */
4428 mode1 = smallest_mode_for_size (bitsize, MODE_INT);
4429 if (bitpos >= BITS_PER_UNIT)
4431 op0 = adjust_address_nv (op0, mode1, bitpos / BITS_PER_UNIT);
4432 bitpos %= BITS_PER_UNIT;
4434 else if (bitpos < 0)
4436 HOST_WIDE_INT units
4437 = (-bitpos + BITS_PER_UNIT - 1) / BITS_PER_UNIT;
4438 op0 = adjust_address_nv (op0, mode1, units);
4439 bitpos += units * BITS_PER_UNIT;
4441 else if (bitpos == 0 && bitsize == GET_MODE_BITSIZE (mode))
4442 op0 = adjust_address_nv (op0, mode, 0);
4443 else if (GET_MODE (op0) != mode1)
4444 op0 = adjust_address_nv (op0, mode1, 0);
4445 else
4446 op0 = copy_rtx (op0);
4447 if (op0 == orig_op0)
4448 op0 = shallow_copy_rtx (op0);
4449 set_mem_attributes (op0, exp, 0);
4452 if (bitpos == 0 && mode == GET_MODE (op0))
4453 return op0;
4455 if (bitpos < 0)
4456 return NULL;
4458 if (GET_MODE (op0) == BLKmode)
4459 return NULL;
4461 if ((bitpos % BITS_PER_UNIT) == 0
4462 && bitsize == GET_MODE_BITSIZE (mode1))
4464 machine_mode opmode = GET_MODE (op0);
4466 if (opmode == VOIDmode)
4467 opmode = TYPE_MODE (TREE_TYPE (tem));
4469 /* This condition may hold if we're expanding the address
4470 right past the end of an array that turned out not to
4471 be addressable (i.e., the address was only computed in
4472 debug stmts). The gen_subreg below would rightfully
4473 crash, and the address doesn't really exist, so just
4474 drop it. */
4475 if (bitpos >= GET_MODE_BITSIZE (opmode))
4476 return NULL;
4478 if ((bitpos % GET_MODE_BITSIZE (mode)) == 0)
4479 return simplify_gen_subreg (mode, op0, opmode,
4480 bitpos / BITS_PER_UNIT);
4483 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4484 && TYPE_UNSIGNED (TREE_TYPE (exp))
4485 ? SIGN_EXTRACT
4486 : ZERO_EXTRACT, mode,
4487 GET_MODE (op0) != VOIDmode
4488 ? GET_MODE (op0)
4489 : TYPE_MODE (TREE_TYPE (tem)),
4490 op0, GEN_INT (bitsize), GEN_INT (bitpos));
4493 case ABS_EXPR:
4494 return simplify_gen_unary (ABS, mode, op0, mode);
4496 case NEGATE_EXPR:
4497 return simplify_gen_unary (NEG, mode, op0, mode);
4499 case BIT_NOT_EXPR:
4500 return simplify_gen_unary (NOT, mode, op0, mode);
4502 case FLOAT_EXPR:
4503 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4504 0)))
4505 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4506 inner_mode);
4508 case FIX_TRUNC_EXPR:
4509 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4510 inner_mode);
4512 case POINTER_PLUS_EXPR:
4513 /* For the rare target where pointers are not the same size as
4514 size_t, we need to check for mis-matched modes and correct
4515 the addend. */
4516 if (op0 && op1
4517 && GET_MODE (op0) != VOIDmode && GET_MODE (op1) != VOIDmode
4518 && GET_MODE (op0) != GET_MODE (op1))
4520 if (GET_MODE_BITSIZE (GET_MODE (op0)) < GET_MODE_BITSIZE (GET_MODE (op1))
4521 /* If OP0 is a partial mode, then we must truncate, even if it has
4522 the same bitsize as OP1 as GCC's representation of partial modes
4523 is opaque. */
4524 || (GET_MODE_CLASS (GET_MODE (op0)) == MODE_PARTIAL_INT
4525 && GET_MODE_BITSIZE (GET_MODE (op0)) == GET_MODE_BITSIZE (GET_MODE (op1))))
4526 op1 = simplify_gen_unary (TRUNCATE, GET_MODE (op0), op1,
4527 GET_MODE (op1));
4528 else
4529 /* We always sign-extend, regardless of the signedness of
4530 the operand, because the operand is always unsigned
4531 here even if the original C expression is signed. */
4532 op1 = simplify_gen_unary (SIGN_EXTEND, GET_MODE (op0), op1,
4533 GET_MODE (op1));
4535 /* Fall through. */
4536 case PLUS_EXPR:
4537 return simplify_gen_binary (PLUS, mode, op0, op1);
4539 case MINUS_EXPR:
4540 return simplify_gen_binary (MINUS, mode, op0, op1);
4542 case MULT_EXPR:
4543 return simplify_gen_binary (MULT, mode, op0, op1);
4545 case RDIV_EXPR:
4546 case TRUNC_DIV_EXPR:
4547 case EXACT_DIV_EXPR:
4548 if (unsignedp)
4549 return simplify_gen_binary (UDIV, mode, op0, op1);
4550 else
4551 return simplify_gen_binary (DIV, mode, op0, op1);
4553 case TRUNC_MOD_EXPR:
4554 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4556 case FLOOR_DIV_EXPR:
4557 if (unsignedp)
4558 return simplify_gen_binary (UDIV, mode, op0, op1);
4559 else
4561 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4562 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4563 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4564 return simplify_gen_binary (PLUS, mode, div, adj);
4567 case FLOOR_MOD_EXPR:
4568 if (unsignedp)
4569 return simplify_gen_binary (UMOD, mode, op0, op1);
4570 else
4572 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4573 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4574 adj = simplify_gen_unary (NEG, mode,
4575 simplify_gen_binary (MULT, mode, adj, op1),
4576 mode);
4577 return simplify_gen_binary (PLUS, mode, mod, adj);
4580 case CEIL_DIV_EXPR:
4581 if (unsignedp)
4583 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4584 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4585 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4586 return simplify_gen_binary (PLUS, mode, div, adj);
4588 else
4590 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4591 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4592 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4593 return simplify_gen_binary (PLUS, mode, div, adj);
4596 case CEIL_MOD_EXPR:
4597 if (unsignedp)
4599 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4600 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4601 adj = simplify_gen_unary (NEG, mode,
4602 simplify_gen_binary (MULT, mode, adj, op1),
4603 mode);
4604 return simplify_gen_binary (PLUS, mode, mod, adj);
4606 else
4608 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4609 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4610 adj = simplify_gen_unary (NEG, mode,
4611 simplify_gen_binary (MULT, mode, adj, op1),
4612 mode);
4613 return simplify_gen_binary (PLUS, mode, mod, adj);
4616 case ROUND_DIV_EXPR:
4617 if (unsignedp)
4619 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4620 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4621 rtx adj = round_udiv_adjust (mode, mod, op1);
4622 return simplify_gen_binary (PLUS, mode, div, adj);
4624 else
4626 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4627 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4628 rtx adj = round_sdiv_adjust (mode, mod, op1);
4629 return simplify_gen_binary (PLUS, mode, div, adj);
4632 case ROUND_MOD_EXPR:
4633 if (unsignedp)
4635 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4636 rtx adj = round_udiv_adjust (mode, mod, op1);
4637 adj = simplify_gen_unary (NEG, mode,
4638 simplify_gen_binary (MULT, mode, adj, op1),
4639 mode);
4640 return simplify_gen_binary (PLUS, mode, mod, adj);
4642 else
4644 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4645 rtx adj = round_sdiv_adjust (mode, mod, op1);
4646 adj = simplify_gen_unary (NEG, mode,
4647 simplify_gen_binary (MULT, mode, adj, op1),
4648 mode);
4649 return simplify_gen_binary (PLUS, mode, mod, adj);
4652 case LSHIFT_EXPR:
4653 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4655 case RSHIFT_EXPR:
4656 if (unsignedp)
4657 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4658 else
4659 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4661 case LROTATE_EXPR:
4662 return simplify_gen_binary (ROTATE, mode, op0, op1);
4664 case RROTATE_EXPR:
4665 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4667 case MIN_EXPR:
4668 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4670 case MAX_EXPR:
4671 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4673 case BIT_AND_EXPR:
4674 case TRUTH_AND_EXPR:
4675 return simplify_gen_binary (AND, mode, op0, op1);
4677 case BIT_IOR_EXPR:
4678 case TRUTH_OR_EXPR:
4679 return simplify_gen_binary (IOR, mode, op0, op1);
4681 case BIT_XOR_EXPR:
4682 case TRUTH_XOR_EXPR:
4683 return simplify_gen_binary (XOR, mode, op0, op1);
4685 case TRUTH_ANDIF_EXPR:
4686 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4688 case TRUTH_ORIF_EXPR:
4689 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4691 case TRUTH_NOT_EXPR:
4692 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4694 case LT_EXPR:
4695 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4696 op0, op1);
4698 case LE_EXPR:
4699 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4700 op0, op1);
4702 case GT_EXPR:
4703 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4704 op0, op1);
4706 case GE_EXPR:
4707 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4708 op0, op1);
4710 case EQ_EXPR:
4711 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4713 case NE_EXPR:
4714 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4716 case UNORDERED_EXPR:
4717 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4719 case ORDERED_EXPR:
4720 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4722 case UNLT_EXPR:
4723 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4725 case UNLE_EXPR:
4726 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4728 case UNGT_EXPR:
4729 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4731 case UNGE_EXPR:
4732 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4734 case UNEQ_EXPR:
4735 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4737 case LTGT_EXPR:
4738 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4740 case COND_EXPR:
4741 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4743 case COMPLEX_EXPR:
4744 gcc_assert (COMPLEX_MODE_P (mode));
4745 if (GET_MODE (op0) == VOIDmode)
4746 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4747 if (GET_MODE (op1) == VOIDmode)
4748 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4749 return gen_rtx_CONCAT (mode, op0, op1);
4751 case CONJ_EXPR:
4752 if (GET_CODE (op0) == CONCAT)
4753 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4754 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4755 XEXP (op0, 1),
4756 GET_MODE_INNER (mode)));
4757 else
4759 machine_mode imode = GET_MODE_INNER (mode);
4760 rtx re, im;
4762 if (MEM_P (op0))
4764 re = adjust_address_nv (op0, imode, 0);
4765 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4767 else
4769 machine_mode ifmode = int_mode_for_mode (mode);
4770 machine_mode ihmode = int_mode_for_mode (imode);
4771 rtx halfsize;
4772 if (ifmode == BLKmode || ihmode == BLKmode)
4773 return NULL;
4774 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4775 re = op0;
4776 if (mode != ifmode)
4777 re = gen_rtx_SUBREG (ifmode, re, 0);
4778 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4779 if (imode != ihmode)
4780 re = gen_rtx_SUBREG (imode, re, 0);
4781 im = copy_rtx (op0);
4782 if (mode != ifmode)
4783 im = gen_rtx_SUBREG (ifmode, im, 0);
4784 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4785 if (imode != ihmode)
4786 im = gen_rtx_SUBREG (imode, im, 0);
4788 im = gen_rtx_NEG (imode, im);
4789 return gen_rtx_CONCAT (mode, re, im);
4792 case ADDR_EXPR:
4793 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4794 if (!op0 || !MEM_P (op0))
4796 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4797 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4798 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4799 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4800 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4801 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4803 if (handled_component_p (TREE_OPERAND (exp, 0)))
4805 HOST_WIDE_INT bitoffset, bitsize, maxsize;
4806 tree decl
4807 = get_ref_base_and_extent (TREE_OPERAND (exp, 0),
4808 &bitoffset, &bitsize, &maxsize);
4809 if ((TREE_CODE (decl) == VAR_DECL
4810 || TREE_CODE (decl) == PARM_DECL
4811 || TREE_CODE (decl) == RESULT_DECL)
4812 && (!TREE_ADDRESSABLE (decl)
4813 || target_for_debug_bind (decl))
4814 && (bitoffset % BITS_PER_UNIT) == 0
4815 && bitsize > 0
4816 && bitsize == maxsize)
4818 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4819 return plus_constant (mode, base, bitoffset / BITS_PER_UNIT);
4823 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4824 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4825 == ADDR_EXPR)
4827 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4828 0));
4829 if (op0 != NULL
4830 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4831 || (GET_CODE (op0) == PLUS
4832 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4833 && CONST_INT_P (XEXP (op0, 1)))))
4835 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4836 1));
4837 if (!op1 || !CONST_INT_P (op1))
4838 return NULL;
4840 return plus_constant (mode, op0, INTVAL (op1));
4844 return NULL;
4847 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4848 op0 = convert_debug_memory_address (mode, XEXP (op0, 0), as);
4850 return op0;
4852 case VECTOR_CST:
4854 unsigned i;
4856 op0 = gen_rtx_CONCATN
4857 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4859 for (i = 0; i < VECTOR_CST_NELTS (exp); ++i)
4861 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4862 if (!op1)
4863 return NULL;
4864 XVECEXP (op0, 0, i) = op1;
4867 return op0;
4870 case CONSTRUCTOR:
4871 if (TREE_CLOBBER_P (exp))
4872 return NULL;
4873 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4875 unsigned i;
4876 tree val;
4878 op0 = gen_rtx_CONCATN
4879 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4881 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4883 op1 = expand_debug_expr (val);
4884 if (!op1)
4885 return NULL;
4886 XVECEXP (op0, 0, i) = op1;
4889 if (i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)))
4891 op1 = expand_debug_expr
4892 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4894 if (!op1)
4895 return NULL;
4897 for (; i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)); i++)
4898 XVECEXP (op0, 0, i) = op1;
4901 return op0;
4903 else
4904 goto flag_unsupported;
4906 case CALL_EXPR:
4907 /* ??? Maybe handle some builtins? */
4908 return NULL;
4910 case SSA_NAME:
4912 gimple *g = get_gimple_for_ssa_name (exp);
4913 if (g)
4915 tree t = NULL_TREE;
4916 if (deep_ter_debug_map)
4918 tree *slot = deep_ter_debug_map->get (exp);
4919 if (slot)
4920 t = *slot;
4922 if (t == NULL_TREE)
4923 t = gimple_assign_rhs_to_tree (g);
4924 op0 = expand_debug_expr (t);
4925 if (!op0)
4926 return NULL;
4928 else
4930 /* If this is a reference to an incoming value of
4931 parameter that is never used in the code or where the
4932 incoming value is never used in the code, use
4933 PARM_DECL's DECL_RTL if set. */
4934 if (SSA_NAME_IS_DEFAULT_DEF (exp)
4935 && SSA_NAME_VAR (exp)
4936 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
4937 && has_zero_uses (exp))
4939 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
4940 if (op0)
4941 goto adjust_mode;
4942 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
4943 if (op0)
4944 goto adjust_mode;
4947 int part = var_to_partition (SA.map, exp);
4949 if (part == NO_PARTITION)
4950 return NULL;
4952 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
4954 op0 = copy_rtx (SA.partition_to_pseudo[part]);
4956 goto adjust_mode;
4959 case ERROR_MARK:
4960 return NULL;
4962 /* Vector stuff. For most of the codes we don't have rtl codes. */
4963 case REALIGN_LOAD_EXPR:
4964 case REDUC_MAX_EXPR:
4965 case REDUC_MIN_EXPR:
4966 case REDUC_PLUS_EXPR:
4967 case VEC_COND_EXPR:
4968 case VEC_PACK_FIX_TRUNC_EXPR:
4969 case VEC_PACK_SAT_EXPR:
4970 case VEC_PACK_TRUNC_EXPR:
4971 case VEC_UNPACK_FLOAT_HI_EXPR:
4972 case VEC_UNPACK_FLOAT_LO_EXPR:
4973 case VEC_UNPACK_HI_EXPR:
4974 case VEC_UNPACK_LO_EXPR:
4975 case VEC_WIDEN_MULT_HI_EXPR:
4976 case VEC_WIDEN_MULT_LO_EXPR:
4977 case VEC_WIDEN_MULT_EVEN_EXPR:
4978 case VEC_WIDEN_MULT_ODD_EXPR:
4979 case VEC_WIDEN_LSHIFT_HI_EXPR:
4980 case VEC_WIDEN_LSHIFT_LO_EXPR:
4981 case VEC_PERM_EXPR:
4982 return NULL;
4984 /* Misc codes. */
4985 case ADDR_SPACE_CONVERT_EXPR:
4986 case FIXED_CONVERT_EXPR:
4987 case OBJ_TYPE_REF:
4988 case WITH_SIZE_EXPR:
4989 return NULL;
4991 case DOT_PROD_EXPR:
4992 if (SCALAR_INT_MODE_P (GET_MODE (op0))
4993 && SCALAR_INT_MODE_P (mode))
4996 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4997 0)))
4998 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
4999 inner_mode);
5001 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5002 1)))
5003 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5004 inner_mode);
5005 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5006 return simplify_gen_binary (PLUS, mode, op0, op2);
5008 return NULL;
5010 case WIDEN_MULT_EXPR:
5011 case WIDEN_MULT_PLUS_EXPR:
5012 case WIDEN_MULT_MINUS_EXPR:
5013 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5014 && SCALAR_INT_MODE_P (mode))
5016 inner_mode = GET_MODE (op0);
5017 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5018 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5019 else
5020 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5021 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5022 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5023 else
5024 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5025 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5026 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5027 return op0;
5028 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5029 return simplify_gen_binary (PLUS, mode, op0, op2);
5030 else
5031 return simplify_gen_binary (MINUS, mode, op2, op0);
5033 return NULL;
5035 case MULT_HIGHPART_EXPR:
5036 /* ??? Similar to the above. */
5037 return NULL;
5039 case WIDEN_SUM_EXPR:
5040 case WIDEN_LSHIFT_EXPR:
5041 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5042 && SCALAR_INT_MODE_P (mode))
5045 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5046 0)))
5047 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5048 inner_mode);
5049 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5050 ? ASHIFT : PLUS, mode, op0, op1);
5052 return NULL;
5054 case FMA_EXPR:
5055 return simplify_gen_ternary (FMA, mode, inner_mode, op0, op1, op2);
5057 default:
5058 flag_unsupported:
5059 #ifdef ENABLE_CHECKING
5060 debug_tree (exp);
5061 gcc_unreachable ();
5062 #else
5063 return NULL;
5064 #endif
5068 /* Return an RTX equivalent to the source bind value of the tree expression
5069 EXP. */
5071 static rtx
5072 expand_debug_source_expr (tree exp)
5074 rtx op0 = NULL_RTX;
5075 machine_mode mode = VOIDmode, inner_mode;
5077 switch (TREE_CODE (exp))
5079 case PARM_DECL:
5081 mode = DECL_MODE (exp);
5082 op0 = expand_debug_parm_decl (exp);
5083 if (op0)
5084 break;
5085 /* See if this isn't an argument that has been completely
5086 optimized out. */
5087 if (!DECL_RTL_SET_P (exp)
5088 && !DECL_INCOMING_RTL (exp)
5089 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5091 tree aexp = DECL_ORIGIN (exp);
5092 if (DECL_CONTEXT (aexp)
5093 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5095 vec<tree, va_gc> **debug_args;
5096 unsigned int ix;
5097 tree ddecl;
5098 debug_args = decl_debug_args_lookup (current_function_decl);
5099 if (debug_args != NULL)
5101 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5102 ix += 2)
5103 if (ddecl == aexp)
5104 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5108 break;
5110 default:
5111 break;
5114 if (op0 == NULL_RTX)
5115 return NULL_RTX;
5117 inner_mode = GET_MODE (op0);
5118 if (mode == inner_mode)
5119 return op0;
5121 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5123 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
5124 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5125 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
5126 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5127 else
5128 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5130 else if (FLOAT_MODE_P (mode))
5131 gcc_unreachable ();
5132 else if (FLOAT_MODE_P (inner_mode))
5134 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5135 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5136 else
5137 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5139 else if (CONSTANT_P (op0)
5140 || GET_MODE_BITSIZE (mode) <= GET_MODE_BITSIZE (inner_mode))
5141 op0 = lowpart_subreg (mode, op0, inner_mode);
5142 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5143 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5144 else
5145 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5147 return op0;
5150 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
5151 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5152 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5154 static void
5155 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5157 rtx exp = *exp_p;
5159 if (exp == NULL_RTX)
5160 return;
5162 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5163 return;
5165 if (depth == 4)
5167 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5168 rtx dval = make_debug_expr_from_rtl (exp);
5170 /* Emit a debug bind insn before INSN. */
5171 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5172 DEBUG_EXPR_TREE_DECL (dval), exp,
5173 VAR_INIT_STATUS_INITIALIZED);
5175 emit_debug_insn_before (bind, insn);
5176 *exp_p = dval;
5177 return;
5180 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5181 int i, j;
5182 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5183 switch (*format_ptr++)
5185 case 'e':
5186 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5187 break;
5189 case 'E':
5190 case 'V':
5191 for (j = 0; j < XVECLEN (exp, i); j++)
5192 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5193 break;
5195 default:
5196 break;
5200 /* Expand the _LOCs in debug insns. We run this after expanding all
5201 regular insns, so that any variables referenced in the function
5202 will have their DECL_RTLs set. */
5204 static void
5205 expand_debug_locations (void)
5207 rtx_insn *insn;
5208 rtx_insn *last = get_last_insn ();
5209 int save_strict_alias = flag_strict_aliasing;
5211 /* New alias sets while setting up memory attributes cause
5212 -fcompare-debug failures, even though it doesn't bring about any
5213 codegen changes. */
5214 flag_strict_aliasing = 0;
5216 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5217 if (DEBUG_INSN_P (insn))
5219 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5220 rtx val;
5221 rtx_insn *prev_insn, *insn2;
5222 machine_mode mode;
5224 if (value == NULL_TREE)
5225 val = NULL_RTX;
5226 else
5228 if (INSN_VAR_LOCATION_STATUS (insn)
5229 == VAR_INIT_STATUS_UNINITIALIZED)
5230 val = expand_debug_source_expr (value);
5231 /* The avoid_deep_ter_for_debug function inserts
5232 debug bind stmts after SSA_NAME definition, with the
5233 SSA_NAME as the whole bind location. Disable temporarily
5234 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5235 being defined in this DEBUG_INSN. */
5236 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5238 tree *slot = deep_ter_debug_map->get (value);
5239 if (slot)
5241 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5242 *slot = NULL_TREE;
5243 else
5244 slot = NULL;
5246 val = expand_debug_expr (value);
5247 if (slot)
5248 *slot = INSN_VAR_LOCATION_DECL (insn);
5250 else
5251 val = expand_debug_expr (value);
5252 gcc_assert (last == get_last_insn ());
5255 if (!val)
5256 val = gen_rtx_UNKNOWN_VAR_LOC ();
5257 else
5259 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5261 gcc_assert (mode == GET_MODE (val)
5262 || (GET_MODE (val) == VOIDmode
5263 && (CONST_SCALAR_INT_P (val)
5264 || GET_CODE (val) == CONST_FIXED
5265 || GET_CODE (val) == LABEL_REF)));
5268 INSN_VAR_LOCATION_LOC (insn) = val;
5269 prev_insn = PREV_INSN (insn);
5270 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5271 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5274 flag_strict_aliasing = save_strict_alias;
5277 /* Performs swapping operands of commutative operations to expand
5278 the expensive one first. */
5280 static void
5281 reorder_operands (basic_block bb)
5283 unsigned int *lattice; /* Hold cost of each statement. */
5284 unsigned int i = 0, n = 0;
5285 gimple_stmt_iterator gsi;
5286 gimple_seq stmts;
5287 gimple *stmt;
5288 bool swap;
5289 tree op0, op1;
5290 ssa_op_iter iter;
5291 use_operand_p use_p;
5292 gimple *def0, *def1;
5294 /* Compute cost of each statement using estimate_num_insns. */
5295 stmts = bb_seq (bb);
5296 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5298 stmt = gsi_stmt (gsi);
5299 if (!is_gimple_debug (stmt))
5300 gimple_set_uid (stmt, n++);
5302 lattice = XNEWVEC (unsigned int, n);
5303 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5305 unsigned cost;
5306 stmt = gsi_stmt (gsi);
5307 if (is_gimple_debug (stmt))
5308 continue;
5309 cost = estimate_num_insns (stmt, &eni_size_weights);
5310 lattice[i] = cost;
5311 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5313 tree use = USE_FROM_PTR (use_p);
5314 gimple *def_stmt;
5315 if (TREE_CODE (use) != SSA_NAME)
5316 continue;
5317 def_stmt = get_gimple_for_ssa_name (use);
5318 if (!def_stmt)
5319 continue;
5320 lattice[i] += lattice[gimple_uid (def_stmt)];
5322 i++;
5323 if (!is_gimple_assign (stmt)
5324 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5325 continue;
5326 op0 = gimple_op (stmt, 1);
5327 op1 = gimple_op (stmt, 2);
5328 if (TREE_CODE (op0) != SSA_NAME
5329 || TREE_CODE (op1) != SSA_NAME)
5330 continue;
5331 /* Swap operands if the second one is more expensive. */
5332 def0 = get_gimple_for_ssa_name (op0);
5333 def1 = get_gimple_for_ssa_name (op1);
5334 if (!def1)
5335 continue;
5336 swap = false;
5337 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5338 swap = true;
5339 if (swap)
5341 if (dump_file && (dump_flags & TDF_DETAILS))
5343 fprintf (dump_file, "Swap operands in stmt:\n");
5344 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5345 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5346 def0 ? lattice[gimple_uid (def0)] : 0,
5347 lattice[gimple_uid (def1)]);
5349 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5350 gimple_assign_rhs2_ptr (stmt));
5353 XDELETE (lattice);
5356 /* Expand basic block BB from GIMPLE trees to RTL. */
5358 static basic_block
5359 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5361 gimple_stmt_iterator gsi;
5362 gimple_seq stmts;
5363 gimple *stmt = NULL;
5364 rtx_note *note;
5365 rtx_insn *last;
5366 edge e;
5367 edge_iterator ei;
5369 if (dump_file)
5370 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5371 bb->index);
5373 /* Note that since we are now transitioning from GIMPLE to RTL, we
5374 cannot use the gsi_*_bb() routines because they expect the basic
5375 block to be in GIMPLE, instead of RTL. Therefore, we need to
5376 access the BB sequence directly. */
5377 if (optimize)
5378 reorder_operands (bb);
5379 stmts = bb_seq (bb);
5380 bb->il.gimple.seq = NULL;
5381 bb->il.gimple.phi_nodes = NULL;
5382 rtl_profile_for_bb (bb);
5383 init_rtl_bb_info (bb);
5384 bb->flags |= BB_RTL;
5386 /* Remove the RETURN_EXPR if we may fall through to the exit
5387 instead. */
5388 gsi = gsi_last (stmts);
5389 if (!gsi_end_p (gsi)
5390 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5392 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5394 gcc_assert (single_succ_p (bb));
5395 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5397 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5398 && !gimple_return_retval (ret_stmt))
5400 gsi_remove (&gsi, false);
5401 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5405 gsi = gsi_start (stmts);
5406 if (!gsi_end_p (gsi))
5408 stmt = gsi_stmt (gsi);
5409 if (gimple_code (stmt) != GIMPLE_LABEL)
5410 stmt = NULL;
5413 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5415 if (stmt || elt)
5417 last = get_last_insn ();
5419 if (stmt)
5421 expand_gimple_stmt (stmt);
5422 gsi_next (&gsi);
5425 if (elt)
5426 emit_label (*elt);
5428 /* Java emits line number notes in the top of labels.
5429 ??? Make this go away once line number notes are obsoleted. */
5430 BB_HEAD (bb) = NEXT_INSN (last);
5431 if (NOTE_P (BB_HEAD (bb)))
5432 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5433 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5435 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5437 else
5438 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5440 NOTE_BASIC_BLOCK (note) = bb;
5442 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5444 basic_block new_bb;
5446 stmt = gsi_stmt (gsi);
5448 /* If this statement is a non-debug one, and we generate debug
5449 insns, then this one might be the last real use of a TERed
5450 SSA_NAME, but where there are still some debug uses further
5451 down. Expanding the current SSA name in such further debug
5452 uses by their RHS might lead to wrong debug info, as coalescing
5453 might make the operands of such RHS be placed into the same
5454 pseudo as something else. Like so:
5455 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5456 use(a_1);
5457 a_2 = ...
5458 #DEBUG ... => a_1
5459 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5460 If we now would expand a_1 by its RHS (a_0 + 1) in the debug use,
5461 the write to a_2 would actually have clobbered the place which
5462 formerly held a_0.
5464 So, instead of that, we recognize the situation, and generate
5465 debug temporaries at the last real use of TERed SSA names:
5466 a_1 = a_0 + 1;
5467 #DEBUG #D1 => a_1
5468 use(a_1);
5469 a_2 = ...
5470 #DEBUG ... => #D1
5472 if (MAY_HAVE_DEBUG_INSNS
5473 && SA.values
5474 && !is_gimple_debug (stmt))
5476 ssa_op_iter iter;
5477 tree op;
5478 gimple *def;
5480 location_t sloc = curr_insn_location ();
5482 /* Look for SSA names that have their last use here (TERed
5483 names always have only one real use). */
5484 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5485 if ((def = get_gimple_for_ssa_name (op)))
5487 imm_use_iterator imm_iter;
5488 use_operand_p use_p;
5489 bool have_debug_uses = false;
5491 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5493 if (gimple_debug_bind_p (USE_STMT (use_p)))
5495 have_debug_uses = true;
5496 break;
5500 if (have_debug_uses)
5502 /* OP is a TERed SSA name, with DEF its defining
5503 statement, and where OP is used in further debug
5504 instructions. Generate a debug temporary, and
5505 replace all uses of OP in debug insns with that
5506 temporary. */
5507 gimple *debugstmt;
5508 tree value = gimple_assign_rhs_to_tree (def);
5509 tree vexpr = make_node (DEBUG_EXPR_DECL);
5510 rtx val;
5511 machine_mode mode;
5513 set_curr_insn_location (gimple_location (def));
5515 DECL_ARTIFICIAL (vexpr) = 1;
5516 TREE_TYPE (vexpr) = TREE_TYPE (value);
5517 if (DECL_P (value))
5518 mode = DECL_MODE (value);
5519 else
5520 mode = TYPE_MODE (TREE_TYPE (value));
5521 DECL_MODE (vexpr) = mode;
5523 val = gen_rtx_VAR_LOCATION
5524 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5526 emit_debug_insn (val);
5528 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5530 if (!gimple_debug_bind_p (debugstmt))
5531 continue;
5533 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5534 SET_USE (use_p, vexpr);
5536 update_stmt (debugstmt);
5540 set_curr_insn_location (sloc);
5543 currently_expanding_gimple_stmt = stmt;
5545 /* Expand this statement, then evaluate the resulting RTL and
5546 fixup the CFG accordingly. */
5547 if (gimple_code (stmt) == GIMPLE_COND)
5549 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5550 if (new_bb)
5551 return new_bb;
5553 else if (gimple_debug_bind_p (stmt))
5555 location_t sloc = curr_insn_location ();
5556 gimple_stmt_iterator nsi = gsi;
5558 for (;;)
5560 tree var = gimple_debug_bind_get_var (stmt);
5561 tree value;
5562 rtx val;
5563 machine_mode mode;
5565 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5566 && TREE_CODE (var) != LABEL_DECL
5567 && !target_for_debug_bind (var))
5568 goto delink_debug_stmt;
5570 if (gimple_debug_bind_has_value_p (stmt))
5571 value = gimple_debug_bind_get_value (stmt);
5572 else
5573 value = NULL_TREE;
5575 last = get_last_insn ();
5577 set_curr_insn_location (gimple_location (stmt));
5579 if (DECL_P (var))
5580 mode = DECL_MODE (var);
5581 else
5582 mode = TYPE_MODE (TREE_TYPE (var));
5584 val = gen_rtx_VAR_LOCATION
5585 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5587 emit_debug_insn (val);
5589 if (dump_file && (dump_flags & TDF_DETAILS))
5591 /* We can't dump the insn with a TREE where an RTX
5592 is expected. */
5593 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5594 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5595 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5598 delink_debug_stmt:
5599 /* In order not to generate too many debug temporaries,
5600 we delink all uses of debug statements we already expanded.
5601 Therefore debug statements between definition and real
5602 use of TERed SSA names will continue to use the SSA name,
5603 and not be replaced with debug temps. */
5604 delink_stmt_imm_use (stmt);
5606 gsi = nsi;
5607 gsi_next (&nsi);
5608 if (gsi_end_p (nsi))
5609 break;
5610 stmt = gsi_stmt (nsi);
5611 if (!gimple_debug_bind_p (stmt))
5612 break;
5615 set_curr_insn_location (sloc);
5617 else if (gimple_debug_source_bind_p (stmt))
5619 location_t sloc = curr_insn_location ();
5620 tree var = gimple_debug_source_bind_get_var (stmt);
5621 tree value = gimple_debug_source_bind_get_value (stmt);
5622 rtx val;
5623 machine_mode mode;
5625 last = get_last_insn ();
5627 set_curr_insn_location (gimple_location (stmt));
5629 mode = DECL_MODE (var);
5631 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5632 VAR_INIT_STATUS_UNINITIALIZED);
5634 emit_debug_insn (val);
5636 if (dump_file && (dump_flags & TDF_DETAILS))
5638 /* We can't dump the insn with a TREE where an RTX
5639 is expected. */
5640 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5641 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5642 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5645 set_curr_insn_location (sloc);
5647 else
5649 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5650 if (call_stmt
5651 && gimple_call_tail_p (call_stmt)
5652 && disable_tail_calls)
5653 gimple_call_set_tail (call_stmt, false);
5655 if (call_stmt && gimple_call_tail_p (call_stmt))
5657 bool can_fallthru;
5658 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5659 if (new_bb)
5661 if (can_fallthru)
5662 bb = new_bb;
5663 else
5664 return new_bb;
5667 else
5669 def_operand_p def_p;
5670 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5672 if (def_p != NULL)
5674 /* Ignore this stmt if it is in the list of
5675 replaceable expressions. */
5676 if (SA.values
5677 && bitmap_bit_p (SA.values,
5678 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5679 continue;
5681 last = expand_gimple_stmt (stmt);
5682 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5687 currently_expanding_gimple_stmt = NULL;
5689 /* Expand implicit goto and convert goto_locus. */
5690 FOR_EACH_EDGE (e, ei, bb->succs)
5692 if (e->goto_locus != UNKNOWN_LOCATION)
5693 set_curr_insn_location (e->goto_locus);
5694 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5696 emit_jump (label_rtx_for_bb (e->dest));
5697 e->flags &= ~EDGE_FALLTHRU;
5701 /* Expanded RTL can create a jump in the last instruction of block.
5702 This later might be assumed to be a jump to successor and break edge insertion.
5703 We need to insert dummy move to prevent this. PR41440. */
5704 if (single_succ_p (bb)
5705 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5706 && (last = get_last_insn ())
5707 && JUMP_P (last))
5709 rtx dummy = gen_reg_rtx (SImode);
5710 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5713 do_pending_stack_adjust ();
5715 /* Find the block tail. The last insn in the block is the insn
5716 before a barrier and/or table jump insn. */
5717 last = get_last_insn ();
5718 if (BARRIER_P (last))
5719 last = PREV_INSN (last);
5720 if (JUMP_TABLE_DATA_P (last))
5721 last = PREV_INSN (PREV_INSN (last));
5722 BB_END (bb) = last;
5724 update_bb_for_insn (bb);
5726 return bb;
5730 /* Create a basic block for initialization code. */
5732 static basic_block
5733 construct_init_block (void)
5735 basic_block init_block, first_block;
5736 edge e = NULL;
5737 int flags;
5739 /* Multiple entry points not supported yet. */
5740 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5741 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5742 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5743 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5744 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5746 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5748 /* When entry edge points to first basic block, we don't need jump,
5749 otherwise we have to jump into proper target. */
5750 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5752 tree label = gimple_block_label (e->dest);
5754 emit_jump (jump_target_rtx (label));
5755 flags = 0;
5757 else
5758 flags = EDGE_FALLTHRU;
5760 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5761 get_last_insn (),
5762 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5763 init_block->frequency = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
5764 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5765 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5766 if (e)
5768 first_block = e->dest;
5769 redirect_edge_succ (e, init_block);
5770 e = make_edge (init_block, first_block, flags);
5772 else
5773 e = make_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_FALLTHRU);
5774 e->probability = REG_BR_PROB_BASE;
5775 e->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5777 update_bb_for_insn (init_block);
5778 return init_block;
5781 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5782 found in the block tree. */
5784 static void
5785 set_block_levels (tree block, int level)
5787 while (block)
5789 BLOCK_NUMBER (block) = level;
5790 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5791 block = BLOCK_CHAIN (block);
5795 /* Create a block containing landing pads and similar stuff.
   The function exit RTL is generated with expand_function_end; when
   that emits nothing, no block is created.  Otherwise a new block is
   created after the block preceding the exit block, all non-abnormal
   predecessors of the exit block are redirected to it, and it gets a
   fallthru edge to the exit block.  */
5797 static void
5798 construct_exit_block (void)
/* HEAD is the last insn emitted before the function end is expanded;
   ORIG_END remembers the current end of the block before the exit block.  */
5800 rtx_insn *head = get_last_insn ();
5801 rtx_insn *end;
5802 basic_block exit_block;
5803 edge e, e2;
5804 unsigned ix;
5805 edge_iterator ei;
5806 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5807 rtx_insn *orig_end = BB_END (prev_bb);
5809 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5811 /* Make sure the locus is set to the end of the function, so that
5812 epilogue line numbers and warnings are set properly. */
5813 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5814 input_location = cfun->function_end_locus;
5816 /* Generate rtl for function exit. */
5817 expand_function_end ();
/* Nothing was emitted for the function end: no exit block is needed.  */
5819 end = get_last_insn ();
5820 if (head == end)
5821 return;
5822 /* While emitting the function end we could move end of the last basic
5823 block. */
5824 BB_END (prev_bb) = orig_end;
/* Skip any notes that directly follow HEAD.  */
5825 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5826 head = NEXT_INSN (head);
5827 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5828 bb frequency counting will be confused. Any instructions before that
5829 label are emitted for the case where PREV_BB falls through into the
5830 exit block, so append those instructions to prev_bb in that case. */
5831 if (NEXT_INSN (head) != return_label)
5833 while (NEXT_INSN (head) != return_label)
5835 if (!NOTE_P (NEXT_INSN (head)))
5836 BB_END (prev_bb) = NEXT_INSN (head);
5837 head = NEXT_INSN (head);
/* The new block spans from the insn after HEAD to the last insn and is
   placed after PREV_BB; it inherits the exit block's profile data.  */
5840 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5841 exit_block->frequency = EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency;
5842 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5843 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
/* Redirect every non-abnormal predecessor edge of the exit block to the
   new block.  IX is only advanced when an edge is left in place;
   presumably redirect_edge_succ removes the edge from the predecessor
   vector so that index IX then names the next edge -- TODO confirm.  */
5845 ix = 0;
5846 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5848 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5849 if (!(e->flags & EDGE_ABNORMAL))
5850 redirect_edge_succ (e, exit_block);
5851 else
5852 ix++;
/* Add the fallthru edge from the new block to the exit block, then
   subtract from its profile (and from the new block's) the share of
   every other edge still entering the exit block, clamping at zero.  */
5855 e = make_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_FALLTHRU);
5856 e->probability = REG_BR_PROB_BASE;
5857 e->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5858 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5859 if (e2 != e)
5861 e->count -= e2->count;
5862 exit_block->count -= e2->count;
5863 exit_block->frequency -= EDGE_FREQUENCY (e2);
5865 if (e->count < 0)
5866 e->count = 0;
5867 if (exit_block->count < 0)
5868 exit_block->count = 0;
5869 if (exit_block->frequency < 0)
5870 exit_block->frequency = 0;
5871 update_bb_for_insn (exit_block);
5874 /* Helper function for discover_nonconstant_array_refs.
5875 Look for ARRAY_REF nodes with non-constant indexes and mark them
5876 addressable. */
5878 static tree
5879 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5880 void *data ATTRIBUTE_UNUSED)
5882 tree t = *tp;
5884 if (IS_TYPE_OR_DECL_P (t))
5885 *walk_subtrees = 0;
5886 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5888 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5889 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5890 && (!TREE_OPERAND (t, 2)
5891 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5892 || (TREE_CODE (t) == COMPONENT_REF
5893 && (!TREE_OPERAND (t,2)
5894 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5895 || TREE_CODE (t) == BIT_FIELD_REF
5896 || TREE_CODE (t) == REALPART_EXPR
5897 || TREE_CODE (t) == IMAGPART_EXPR
5898 || TREE_CODE (t) == VIEW_CONVERT_EXPR
5899 || CONVERT_EXPR_P (t))
5900 t = TREE_OPERAND (t, 0);
5902 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5904 t = get_base_address (t);
5905 if (t && DECL_P (t)
5906 && DECL_MODE (t) != BLKmode)
5907 TREE_ADDRESSABLE (t) = 1;
5910 *walk_subtrees = 0;
5913 return NULL_TREE;
5916 /* RTL expansion is not able to compile array references with variable
5917 offsets for arrays stored in single register. Discover such
5918 expressions and mark variables as addressable to avoid this
5919 scenario. */
5921 static void
5922 discover_nonconstant_array_refs (void)
5924 basic_block bb;
5925 gimple_stmt_iterator gsi;
5927 FOR_EACH_BB_FN (bb, cfun)
5928 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5930 gimple *stmt = gsi_stmt (gsi);
5931 if (!is_gimple_debug (stmt))
5932 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
5936 /* This function sets crtl->args.internal_arg_pointer to a virtual
5937 register if DRAP is needed. Local register allocator will replace
5938 virtual_incoming_args_rtx with the virtual register.
   Along the way it finalizes crtl->stack_alignment_estimated,
   crtl->stack_alignment_needed and the crtl->stack_realign_* flags.
   Does nothing when SUPPORTS_STACK_ALIGNMENT is false.  */
5940 static void
5941 expand_stack_alignment (void)
5943 rtx drap_rtx;
5944 unsigned int preferred_stack_boundary;
5946 if (! SUPPORTS_STACK_ALIGNMENT)
5947 return;
/* Functions that call alloca or involve nonlocal labels or gotos are
   flagged as needing DRAP.  */
5949 if (cfun->calls_alloca
5950 || cfun->has_nonlocal_label
5951 || crtl->has_nonlocal_goto)
5952 crtl->need_drap = true;
5954 /* Call update_stack_boundary here again to update incoming stack
5955 boundary. It may set incoming stack alignment to a different
5956 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
5957 use the minimum incoming stack alignment to check if it is OK
5958 to perform sibcall optimization since sibcall optimization will
5959 only align the outgoing stack to incoming stack boundary. */
5960 if (targetm.calls.update_stack_boundary)
5961 targetm.calls.update_stack_boundary ();
5963 /* The incoming stack frame has to be aligned at least at
5964 parm_stack_boundary. */
5965 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
5967 /* Update crtl->stack_alignment_estimated and use it later to align
5968 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
5969 exceptions since callgraph doesn't collect incoming stack alignment
5970 in this case. */
5971 if (cfun->can_throw_non_call_exceptions
5972 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
5973 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
5974 else
5975 preferred_stack_boundary = crtl->preferred_stack_boundary;
/* Raise both the estimated and the needed alignment to at least the
   boundary chosen above.  */
5976 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
5977 crtl->stack_alignment_estimated = preferred_stack_boundary;
5978 if (preferred_stack_boundary > crtl->stack_alignment_needed)
5979 crtl->stack_alignment_needed = preferred_stack_boundary;
5981 gcc_assert (crtl->stack_alignment_needed
5982 <= crtl->stack_alignment_estimated);
/* Realignment is needed when the estimated alignment exceeds what the
   incoming stack boundary provides; the same value is recorded as
   "tried".  */
5984 crtl->stack_realign_needed
5985 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
5986 crtl->stack_realign_tried = crtl->stack_realign_needed;
5988 crtl->stack_realign_processed = true;
5990 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
5991 alignment. */
5992 gcc_assert (targetm.calls.get_drap_rtx != NULL);
5993 drap_rtx = targetm.calls.get_drap_rtx ();
5995 /* stack_realign_drap and drap_rtx must match. */
5996 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
5998 /* Do nothing if NULL is returned, which means DRAP is not needed. */
5999 if (NULL != drap_rtx)
6001 crtl->args.internal_arg_pointer = drap_rtx;
6003 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6004 needed. */
6005 fixup_tail_calls ();
/* Emit a library call to the function named by NAME__MAIN.  The call is
   only compiled in when INVOKE__main is defined, or when none of
   HAS_INIT_SECTION, INIT_SECTION_ASM_OP and INIT_ARRAY_SECTION_ASM_OP
   is defined; otherwise this function does nothing.  */
6010 static void
6011 expand_main_function (void)
6013 #if (defined(INVOKE__main) \
6014 || (!defined(HAS_INIT_SECTION) \
6015 && !defined(INIT_SECTION_ASM_OP) \
6016 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6017 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
6018 #endif
6022 /* Expand code to initialize the stack_protect_guard. This is invoked at
6023 the beginning of a function to be protected. */
6025 static void
6026 stack_protect_prologue (void)
6028 tree guard_decl = targetm.stack_protect_guard ();
6029 rtx x, y;
6031 x = expand_normal (crtl->stack_protect_guard);
6032 y = expand_normal (guard_decl);
6034 /* Allow the target to copy from Y to X without leaking Y into a
6035 register. */
6036 if (targetm.have_stack_protect_set ())
6037 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6039 emit_insn (insn);
6040 return;
6043 /* Otherwise do a straight move. */
6044 emit_move_insn (x, y);
6047 /* Translate the intermediate representation contained in the CFG
6048 from GIMPLE trees to RTL.
6050 We do conversion per basic block and preserve/update the tree CFG.
6051 This implies we have to do some magic as the CFG can simultaneously
6052 consist of basic blocks containing RTL and GIMPLE trees. This can
6053 confuse the CFG hooks, so be careful to not manipulate CFG during
6054 the expansion. */
6056 namespace {
/* Static description of the "expand" pass: an RTL pass timed under
   TV_EXPAND that requires SSA form, a CFG and the listed GIMPLE
   lowering properties, provides PROP_rtl, and destroys PROP_ssa and
   PROP_trees.  No TODO flags are requested before or after the pass.  */
6058 const pass_data pass_data_expand =
6060 RTL_PASS, /* type */
6061 "expand", /* name */
6062 OPTGROUP_NONE, /* optinfo_flags */
6063 TV_EXPAND, /* tv_id */
6064 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6065 | PROP_gimple_lcx
6066 | PROP_gimple_lvec
6067 | PROP_gimple_lva), /* properties_required */
6068 PROP_rtl, /* properties_provided */
6069 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6070 0, /* todo_flags_start */
6071 0, /* todo_flags_finish */
/* The expand pass object.  It is an rtl_opt_pass constructed from
   pass_data_expand and the given context; the only opt_pass method it
   overrides is execute.  */
6074 class pass_expand : public rtl_opt_pass
6076 public:
6077 pass_expand (gcc::context *ctxt)
6078 : rtl_opt_pass (pass_data_expand, ctxt)
6081 /* opt_pass methods: */
6082 virtual unsigned int execute (function *);
6084 }; // class pass_expand
/* Run the expand pass on FUN.  In order: rewrite the function out of
   SSA form, expand the used variables and the function start, assign
   RTL to the partitions, expand every basic block between the init
   block and the exit block, build the exit block, commit pending edge
   insertions, rediscover sub-basic-blocks, set up stack alignment and
   EH, clean up the CFG and finally mark the function as written.
   Always returns 0.  */
6086 unsigned int
6087 pass_expand::execute (function *fun)
6089 basic_block bb, init_block;
6090 sbitmap blocks;
6091 edge_iterator ei;
6092 edge e;
6093 rtx_insn *var_seq, *var_ret_seq;
6094 unsigned i;
6096 timevar_push (TV_OUT_OF_SSA);
6097 rewrite_out_of_ssa (&SA);
6098 timevar_pop (TV_OUT_OF_SSA);
6099 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
/* With debug statements and TER enabled, run avoid_deep_ter_for_debug
   on every debug bind statement before expansion starts.  */
6101 if (MAY_HAVE_DEBUG_STMTS && flag_tree_ter)
6103 gimple_stmt_iterator gsi;
6104 FOR_EACH_BB_FN (bb, cfun)
6105 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6106 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6107 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6110 /* Make sure all values used by the optimization passes have sane
6111 defaults. */
6112 reg_renumber = 0;
6114 /* Some backends want to know that we are expanding to RTL. */
6115 currently_expanding_to_rtl = 1;
6116 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6117 free_dominance_info (CDI_DOMINATORS);
6119 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6121 if (chkp_function_instrumented_p (current_function_decl))
6122 chkp_reset_rtl_bounds ();
/* Choose the location used for the prologue: the function start locus
   when known, else the declaration's source location; builtins get
   UNKNOWN_LOCATION.  */
6124 insn_locations_init ();
6125 if (!DECL_IS_BUILTIN (current_function_decl))
6127 /* Eventually, all FEs should explicitly set function_start_locus. */
6128 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6129 set_curr_insn_location
6130 (DECL_SOURCE_LOCATION (current_function_decl));
6131 else
6132 set_curr_insn_location (fun->function_start_locus);
6134 else
6135 set_curr_insn_location (UNKNOWN_LOCATION);
6136 prologue_location = curr_insn_location ();
6138 #ifdef INSN_SCHEDULING
6139 init_sched_attrs ();
6140 #endif
6142 /* Make sure first insn is a note even if we don't want linenums.
6143 This makes sure the first insn will never be deleted.
6144 Also, final expects a note to appear there. */
6145 emit_note (NOTE_INSN_DELETED);
6147 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6148 discover_nonconstant_array_refs ();
6150 targetm.expand_to_rtl_hook ();
6151 crtl->stack_alignment_needed = STACK_BOUNDARY;
6152 crtl->max_used_stack_slot_alignment = STACK_BOUNDARY;
6153 crtl->stack_alignment_estimated = 0;
6154 crtl->preferred_stack_boundary = STACK_BOUNDARY;
6155 fun->cfg->max_jumptable_ents = 0;
6157 /* Resolve the function section. Some targets, like ARM EABI rely on knowledge
6158 of the function section at expansion time to predict distance of calls. */
6159 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6161 /* Expand the variables recorded during gimple lowering. */
6162 timevar_push (TV_VAR_EXPAND);
6163 start_sequence ();
6165 var_ret_seq = expand_used_vars ();
6167 var_seq = get_insns ();
6168 end_sequence ();
6169 timevar_pop (TV_VAR_EXPAND);
6171 /* Honor stack protection warnings. */
6172 if (warn_stack_protect)
6174 if (fun->calls_alloca)
6175 warning (OPT_Wstack_protector,
6176 "stack protector not protecting local variables: "
6177 "variable length buffer");
6178 if (has_short_buffer && !crtl->stack_protect_guard)
6179 warning (OPT_Wstack_protector,
6180 "stack protector not protecting function: "
6181 "all local arrays are less than %d bytes long",
6182 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
6185 /* Set up parameters and prepare for return, for the function. */
6186 expand_function_start (current_function_decl);
6188 /* If we emitted any instructions for setting up the variables,
6189 emit them before the FUNCTION_START note. */
6190 if (var_seq)
6192 emit_insn_before (var_seq, parm_birth_insn);
6194 /* In expand_function_end we'll insert the alloca save/restore
6195 before parm_birth_insn. We've just inserted an alloca call.
6196 Adjust the pointer to match. */
6197 parm_birth_insn = var_seq;
6200 /* Now propagate the RTL assignment of each partition to the
6201 underlying var of each SSA_NAME. */
6202 for (i = 1; i < num_ssa_names; i++)
6204 tree name = ssa_name (i);
6206 if (!name
6207 /* We might have generated new SSA names in
6208 update_alias_info_with_stack_vars. They will have a NULL
6209 defining statements, and won't be part of the partitioning,
6210 so ignore those. */
6211 || !SSA_NAME_DEF_STMT (name))
6212 continue;
6214 adjust_one_expanded_partition_var (name);
6217 /* Clean up RTL of variables that straddle across multiple
6218 partitions, and check that the rtl of any PARM_DECLs that are not
6219 cleaned up is that of their default defs. */
6220 for (i = 1; i < num_ssa_names; i++)
6222 tree name = ssa_name (i);
6223 int part;
6225 if (!name
6226 /* We might have generated new SSA names in
6227 update_alias_info_with_stack_vars. They will have a NULL
6228 defining statements, and won't be part of the partitioning,
6229 so ignore those. */
6230 || !SSA_NAME_DEF_STMT (name))
6231 continue;
6232 part = var_to_partition (SA.map, name);
6233 if (part == NO_PARTITION)
6234 continue;
6236 /* If this decl was marked as living in multiple places, reset
6237 this now to NULL. */
6238 tree var = SSA_NAME_VAR (name);
6239 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6240 SET_DECL_RTL (var, NULL);
6241 /* Check that the pseudos chosen by assign_parms are those of
6242 the corresponding default defs. */
6243 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6244 && (TREE_CODE (var) == PARM_DECL
6245 || TREE_CODE (var) == RESULT_DECL))
6247 rtx in = DECL_RTL_IF_SET (var);
6248 gcc_assert (in);
6249 rtx out = SA.partition_to_pseudo[part];
6250 gcc_assert (in == out);
6252 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6253 those expected by debug backends for each parm and for
6254 the result. This is particularly important for stabs,
6255 whose register elimination from parm's DECL_RTL may cause
6256 -fcompare-debug differences as SET_DECL_RTL changes reg's
6257 attrs. So, make sure the RTL already has the parm as the
6258 EXPR, so that it won't change. */
6259 SET_DECL_RTL (var, NULL_RTX);
6260 if (MEM_P (in))
6261 set_mem_attributes (in, var, true);
6262 SET_DECL_RTL (var, in);
6266 /* If this function is `main', emit a call to `__main'
6267 to run global initializers, etc. */
6268 if (DECL_NAME (current_function_decl)
6269 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6270 && DECL_FILE_SCOPE_P (current_function_decl))
6271 expand_main_function ();
6273 /* Initialize the stack_protect_guard field. This must happen after the
6274 call to __main (if any) so that the external decl is initialized. */
6275 if (crtl->stack_protect_guard)
6276 stack_protect_prologue ();
6278 expand_phi_nodes (&SA);
6280 /* Register rtl specific functions for cfg. */
6281 rtl_register_cfg_hooks ();
6283 init_block = construct_init_block ();
6285 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6286 remaining edges later. */
6287 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6288 e->flags &= ~EDGE_EXECUTABLE;
/* Expand every block between the init block and the exit block.  The
   loop variable is replaced by the block expand_gimple_basic_block
   returns, and iteration continues from that block's successor.  */
6290 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6291 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6292 next_bb)
6293 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6295 if (MAY_HAVE_DEBUG_INSNS)
6296 expand_debug_locations ();
6298 if (deep_ter_debug_map)
6300 delete deep_ter_debug_map;
6301 deep_ter_debug_map = NULL;
6304 /* Free stuff we no longer need after GIMPLE optimizations. */
6305 free_dominance_info (CDI_DOMINATORS);
6306 free_dominance_info (CDI_POST_DOMINATORS);
6307 delete_tree_cfg_annotations ();
6309 timevar_push (TV_OUT_OF_SSA);
6310 finish_out_of_ssa (&SA);
6311 timevar_pop (TV_OUT_OF_SSA);
6313 timevar_push (TV_POST_EXPAND);
6314 /* We are no longer in SSA form. */
6315 fun->gimple_df->in_ssa_p = false;
6316 loops_state_clear (LOOP_CLOSED_SSA);
6318 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
6319 conservatively to true until they are all profile aware. */
/* NOTE(review): the comment above does not describe the two statements
   that follow (they release the block label map and the histograms);
   it looks like a leftover -- confirm.  */
6320 delete lab_rtx_for_bb;
6321 free_histograms ();
6323 construct_exit_block ();
6324 insn_locations_finalize ();
/* Emit the sequence returned by expand_used_vars after the return
   label, or after the basic-block note directly following it.  */
6326 if (var_ret_seq)
6328 rtx_insn *after = return_label;
6329 rtx_insn *next = NEXT_INSN (after);
6330 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6331 after = next;
6332 emit_insn_after (var_ret_seq, after);
6335 /* Zap the tree EH table. */
6336 set_eh_throw_stmt_table (fun, NULL);
6338 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6339 split edges which edge insertions might do. */
6340 rebuild_jump_labels (get_insns ());
/* Commit the insns queued on edges.  The iterator is only advanced for
   edges without pending insns.  */
6342 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
6343 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6345 edge e;
6346 edge_iterator ei;
6347 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6349 if (e->insns.r)
6351 rebuild_jump_labels_chain (e->insns.r);
6352 /* Put insns after parm birth, but before
6353 NOTE_INSN_FUNCTION_BEG. */
6354 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
6355 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6357 rtx_insn *insns = e->insns.r;
6358 e->insns.r = NULL;
6359 if (NOTE_P (parm_birth_insn)
6360 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6361 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6362 else
6363 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6365 else
6366 commit_one_edge_insertion (e);
6368 else
6369 ei_next (&ei);
6373 /* We're done expanding trees to RTL. */
6374 currently_expanding_to_rtl = 0;
6376 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6377 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6379 edge e;
6380 edge_iterator ei;
6381 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6383 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6384 e->flags &= ~EDGE_EXECUTABLE;
6386 /* At the moment not all abnormal edges match the RTL
6387 representation. It is safe to remove them here as
6388 find_many_sub_basic_blocks will rediscover them.
6389 In the future we should get this fixed properly. */
6390 if ((e->flags & EDGE_ABNORMAL)
6391 && !(e->flags & EDGE_SIBCALL))
6392 remove_edge (e);
6393 else
6394 ei_next (&ei);
/* Run find_many_sub_basic_blocks with every block selected, then purge
   dead edges.  */
6398 blocks = sbitmap_alloc (last_basic_block_for_fn (fun));
6399 bitmap_ones (blocks);
6400 find_many_sub_basic_blocks (blocks);
6401 sbitmap_free (blocks);
6402 purge_all_dead_edges ();
6404 expand_stack_alignment ();
6406 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6407 function. */
6408 if (crtl->tail_call_emit)
6409 fixup_tail_calls ();
6411 /* After initial rtl generation, call back to finish generating
6412 exception support code. We need to do this before cleaning up
6413 the CFG as the code does not expect dead landing pads. */
6414 if (fun->eh->region_tree != NULL)
6415 finish_eh_generation ();
6417 /* Remove unreachable blocks, otherwise we cannot compute dominators
6418 which are needed for loop state verification. As a side-effect
6419 this also compacts blocks.
6420 ??? We cannot remove trivially dead insns here as for example
6421 the DRAP reg on i?86 is not magically live at this point.
6422 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6423 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6425 #ifdef ENABLE_CHECKING
6426 verify_flow_info ();
6427 #endif
6429 /* Initialize pseudos allocated for hard registers. */
6430 emit_initial_value_sets ();
6432 /* And finally unshare all RTL. */
6433 unshare_all_rtl ();
6435 /* There's no need to defer outputting this function any more; we
6436 know we want to output it. */
6437 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6439 /* Now that we're done expanding trees to RTL, we shouldn't have any
6440 more CONCATs anywhere. */
6441 generating_concat_p = 0;
6443 if (dump_file)
6445 fprintf (dump_file,
6446 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6447 /* And the pass manager will dump RTL for us. */
6450 /* If we're emitting a nested function, make sure its parent gets
6451 emitted as well. Doing otherwise confuses debug info. */
6453 tree parent;
6454 for (parent = DECL_CONTEXT (current_function_decl);
6455 parent != NULL_TREE;
6456 parent = get_containing_scope (parent))
6457 if (TREE_CODE (parent) == FUNCTION_DECL)
6458 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6461 /* We are now committed to emitting code for this function. Do any
6462 preparation, such as emitting abstract debug info for the inline
6463 before it gets mangled by optimization. */
6464 if (cgraph_function_possibly_inlined_p (current_function_decl))
6465 (*debug_hooks->outlining_inline_function) (current_function_decl);
6467 TREE_ASM_WRITTEN (current_function_decl) = 1;
6469 /* After expanding, the return labels are no longer needed. */
6470 return_label = NULL;
6471 naked_return_label = NULL;
6473 /* After expanding, the tm_restart map is no longer needed. */
6474 if (fun->gimple_df->tm_restart)
6475 fun->gimple_df->tm_restart = NULL;
6477 /* Tag the blocks with a depth number so that change_scope can find
6478 the common parent easily. */
6479 set_block_levels (DECL_INITIAL (fun->decl), 0);
6480 default_rtl_profile ();
6482 timevar_pop (TV_POST_EXPAND);
6484 return 0;
6487 } // anon namespace
/* Factory for the expand pass: return a newly allocated pass_expand
   object created for context CTXT.  */
6489 rtl_opt_pass *
6490 make_pass_expand (gcc::context *ctxt)
6492 return new pass_expand (ctxt);