gcc/cfgexpand.c
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2020 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "target.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "cfghooks.h"
29 #include "tree-pass.h"
30 #include "memmodel.h"
31 #include "tm_p.h"
32 #include "ssa.h"
33 #include "optabs.h"
34 #include "regs.h" /* For reg_renumber. */
35 #include "emit-rtl.h"
36 #include "recog.h"
37 #include "cgraph.h"
38 #include "diagnostic.h"
39 #include "fold-const.h"
40 #include "varasm.h"
41 #include "stor-layout.h"
42 #include "stmt.h"
43 #include "print-tree.h"
44 #include "cfgrtl.h"
45 #include "cfganal.h"
46 #include "cfgbuild.h"
47 #include "cfgcleanup.h"
48 #include "dojump.h"
49 #include "explow.h"
50 #include "calls.h"
51 #include "expr.h"
52 #include "internal-fn.h"
53 #include "tree-eh.h"
54 #include "gimple-iterator.h"
55 #include "gimple-expr.h"
56 #include "gimple-walk.h"
57 #include "tree-cfg.h"
58 #include "tree-dfa.h"
59 #include "tree-ssa.h"
60 #include "except.h"
61 #include "gimple-pretty-print.h"
62 #include "toplev.h"
63 #include "debug.h"
64 #include "tree-inline.h"
65 #include "value-prof.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "cfgloop.h"
69 #include "insn-attr.h" /* For INSN_SCHEDULING. */
70 #include "stringpool.h"
71 #include "attribs.h"
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "output.h"
75 #include "builtins.h"
 77 /* Some systems use __main in a way incompatible with its use in gcc; in these
78 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
79 give the same symbol without quotes for an alternative entry point. You
80 must define both, or neither. */
81 #ifndef NAME__MAIN
82 #define NAME__MAIN "__main"
83 #endif
85 /* This variable holds information helping the rewriting of SSA trees
86 into RTL. */
87 struct ssaexpand SA;
89 /* This variable holds the currently expanded gimple statement for purposes
 90 of communicating the profile info to the builtin expanders. */
91 gimple *currently_expanding_gimple_stmt;
93 static rtx expand_debug_expr (tree);
95 static bool defer_stack_allocation (tree, bool);
97 static void record_alignment_for_reg_var (unsigned int);
99 /* Return an expression tree corresponding to the RHS of GIMPLE
100 statement STMT. */
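/* For example (illustrative, not part of the original sources): for the
   gimple assignment x_1 = y_2 + z_3, which has a GIMPLE_BINARY_RHS, this
   builds build2 (PLUS_EXPR, TREE_TYPE (x_1), y_2, z_3); for a
   GIMPLE_SINGLE_RHS such as x_1 = y_2 the RHS tree is returned (possibly
   copied) as-is.  */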
102 tree
103 gimple_assign_rhs_to_tree (gimple *stmt)
105 tree t;
106 switch (gimple_assign_rhs_class (stmt))
108 case GIMPLE_TERNARY_RHS:
109 t = build3 (gimple_assign_rhs_code (stmt),
110 TREE_TYPE (gimple_assign_lhs (stmt)),
111 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt),
112 gimple_assign_rhs3 (stmt));
113 break;
114 case GIMPLE_BINARY_RHS:
115 t = build2 (gimple_assign_rhs_code (stmt),
116 TREE_TYPE (gimple_assign_lhs (stmt)),
117 gimple_assign_rhs1 (stmt), gimple_assign_rhs2 (stmt));
118 break;
119 case GIMPLE_UNARY_RHS:
120 t = build1 (gimple_assign_rhs_code (stmt),
121 TREE_TYPE (gimple_assign_lhs (stmt)),
122 gimple_assign_rhs1 (stmt));
123 break;
124 case GIMPLE_SINGLE_RHS:
126 t = gimple_assign_rhs1 (stmt);
127 /* Avoid modifying this tree in place below. */
128 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
129 && gimple_location (stmt) != EXPR_LOCATION (t))
130 || (gimple_block (stmt) && currently_expanding_to_rtl
131 && EXPR_P (t)))
132 t = copy_node (t);
133 break;
135 default:
136 gcc_unreachable ();
139 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
140 SET_EXPR_LOCATION (t, gimple_location (stmt));
142 return t;
146 #ifndef STACK_ALIGNMENT_NEEDED
147 #define STACK_ALIGNMENT_NEEDED 1
148 #endif
150 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
152 /* Choose either CUR or NEXT as the leader DECL for a partition.
 153 Prefer ignored decls, to simplify debug dumps and reduce the ambiguity
 154 that arises when the same user variable appears in multiple partitions (this is
155 less likely for compiler-introduced temps). */
157 static tree
158 leader_merge (tree cur, tree next)
160 if (cur == NULL || cur == next)
161 return next;
163 if (DECL_P (cur) && DECL_IGNORED_P (cur))
164 return cur;
166 if (DECL_P (next) && DECL_IGNORED_P (next))
167 return next;
169 return cur;
 172 /* Associate declaration T with storage space X. If T is not an
 173 SSA name, this is exactly SET_DECL_RTL; otherwise make the
174 partition of T associated with X. */
175 static inline void
176 set_rtl (tree t, rtx x)
178 gcc_checking_assert (!x
179 || !(TREE_CODE (t) == SSA_NAME || is_gimple_reg (t))
180 || (use_register_for_decl (t)
181 ? (REG_P (x)
182 || (GET_CODE (x) == CONCAT
183 && (REG_P (XEXP (x, 0))
184 || SUBREG_P (XEXP (x, 0)))
185 && (REG_P (XEXP (x, 1))
186 || SUBREG_P (XEXP (x, 1))))
 187 /* We need to accept PARALLELs for RESULT_DECLs
188 because of vector types with BLKmode returned
189 in multiple registers, but they are supposed
190 to be uncoalesced. */
191 || (GET_CODE (x) == PARALLEL
192 && SSAVAR (t)
193 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
194 && (GET_MODE (x) == BLKmode
195 || !flag_tree_coalesce_vars)))
196 : (MEM_P (x) || x == pc_rtx
197 || (GET_CODE (x) == CONCAT
198 && MEM_P (XEXP (x, 0))
199 && MEM_P (XEXP (x, 1))))));
200 /* Check that the RTL for SSA_NAMEs and gimple-reg PARM_DECLs and
201 RESULT_DECLs has the expected mode. For memory, we accept
202 unpromoted modes, since that's what we're likely to get. For
203 PARM_DECLs and RESULT_DECLs, we'll have been called by
204 set_parm_rtl, which will give us the default def, so we don't
205 have to compute it ourselves. For RESULT_DECLs, we accept mode
206 mismatches too, as long as we have BLKmode or are not coalescing
207 across variables, so that we don't reject BLKmode PARALLELs or
208 unpromoted REGs. */
209 gcc_checking_assert (!x || x == pc_rtx || TREE_CODE (t) != SSA_NAME
210 || (SSAVAR (t)
211 && TREE_CODE (SSAVAR (t)) == RESULT_DECL
212 && (promote_ssa_mode (t, NULL) == BLKmode
213 || !flag_tree_coalesce_vars))
214 || !use_register_for_decl (t)
215 || GET_MODE (x) == promote_ssa_mode (t, NULL));
217 if (x)
219 bool skip = false;
220 tree cur = NULL_TREE;
221 rtx xm = x;
223 retry:
224 if (MEM_P (xm))
225 cur = MEM_EXPR (xm);
226 else if (REG_P (xm))
227 cur = REG_EXPR (xm);
228 else if (SUBREG_P (xm))
230 gcc_assert (subreg_lowpart_p (xm));
231 xm = SUBREG_REG (xm);
232 goto retry;
234 else if (GET_CODE (xm) == CONCAT)
236 xm = XEXP (xm, 0);
237 goto retry;
239 else if (GET_CODE (xm) == PARALLEL)
241 xm = XVECEXP (xm, 0, 0);
242 gcc_assert (GET_CODE (xm) == EXPR_LIST);
243 xm = XEXP (xm, 0);
244 goto retry;
246 else if (xm == pc_rtx)
247 skip = true;
248 else
249 gcc_unreachable ();
251 tree next = skip ? cur : leader_merge (cur, SSAVAR (t) ? SSAVAR (t) : t);
253 if (cur != next)
255 if (MEM_P (x))
256 set_mem_attributes (x,
257 next && TREE_CODE (next) == SSA_NAME
258 ? TREE_TYPE (next)
259 : next, true);
260 else
261 set_reg_attrs_for_decl_rtl (next, x);
265 if (TREE_CODE (t) == SSA_NAME)
267 int part = var_to_partition (SA.map, t);
268 if (part != NO_PARTITION)
270 if (SA.partition_to_pseudo[part])
271 gcc_assert (SA.partition_to_pseudo[part] == x);
272 else if (x != pc_rtx)
273 SA.partition_to_pseudo[part] = x;
275 /* For the benefit of debug information at -O0 (where
276 vartracking doesn't run) record the place also in the base
277 DECL. For PARMs and RESULTs, do so only when setting the
278 default def. */
279 if (x && x != pc_rtx && SSA_NAME_VAR (t)
280 && (VAR_P (SSA_NAME_VAR (t))
281 || SSA_NAME_IS_DEFAULT_DEF (t)))
283 tree var = SSA_NAME_VAR (t);
284 /* If we don't yet have something recorded, just record it now. */
285 if (!DECL_RTL_SET_P (var))
286 SET_DECL_RTL (var, x);
287 /* If we have it set already to "multiple places" don't
288 change this. */
289 else if (DECL_RTL (var) == pc_rtx)
291 /* If we have something recorded and it's not the same place
292 as we want to record now, we have multiple partitions for the
293 same base variable, with different places. We can't just
 294 randomly choose one, hence we have to say that we don't know.
295 This only happens with optimization, and there var-tracking
296 will figure out the right thing. */
297 else if (DECL_RTL (var) != x)
298 SET_DECL_RTL (var, pc_rtx);
301 else
302 SET_DECL_RTL (t, x);
305 /* This structure holds data relevant to one variable that will be
306 placed in a stack slot. */
307 class stack_var
309 public:
 310 /* The variable. */
311 tree decl;
313 /* Initially, the size of the variable. Later, the size of the partition,
 314 if this variable becomes its partition's representative. */
315 poly_uint64 size;
 317 /* The *byte* alignment required for this variable. Or, as with the
 318 size, the alignment for this partition. */
319 unsigned int alignb;
321 /* The partition representative. */
322 size_t representative;
324 /* The next stack variable in the partition, or EOC. */
325 size_t next;
 327 /* The indices of conflicting stack variables. */
328 bitmap conflicts;
331 #define EOC ((size_t)-1)
333 /* We have an array of such objects while deciding allocation. */
334 static class stack_var *stack_vars;
335 static size_t stack_vars_alloc;
336 static size_t stack_vars_num;
337 static hash_map<tree, size_t> *decl_to_stack_part;
339 /* Conflict bitmaps go on this obstack. This allows us to destroy
340 all of them in one big sweep. */
341 static bitmap_obstack stack_var_bitmap_obstack;
343 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
 344 is non-increasing. */
345 static size_t *stack_vars_sorted;
347 /* The phase of the stack frame. This is the known misalignment of
348 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
349 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
350 static int frame_phase;
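/* Illustrative example (values depend on the target): with a 16-byte
   PREFERRED_STACK_BOUNDARY and frame_phase == 8, a frame_offset of -24
   satisfies the invariant above, since (-24 + 8) % 16 == 0.  */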
352 /* Used during expand_used_vars to remember if we saw any decls for
353 which we'd like to enable stack smashing protection. */
354 static bool has_protected_decls;
 356 /* Used during expand_used_vars. Remember if we saw a character buffer
357 smaller than our cutoff threshold. Used for -Wstack-protector. */
358 static bool has_short_buffer;
 360 /* Compute the byte alignment to use for DECL. Ignore alignment
 361 we can't satisfy given the expected alignment of the stack boundary. */
363 static unsigned int
364 align_local_variable (tree decl, bool really_expand)
366 unsigned int align;
368 if (TREE_CODE (decl) == SSA_NAME)
370 tree type = TREE_TYPE (decl);
371 machine_mode mode = TYPE_MODE (type);
373 align = TYPE_ALIGN (type);
374 if (mode != BLKmode
375 && align < GET_MODE_ALIGNMENT (mode))
376 align = GET_MODE_ALIGNMENT (mode);
378 else
380 align = LOCAL_DECL_ALIGNMENT (decl);
381 /* Don't change DECL_ALIGN when called from estimated_stack_frame_size.
382 That is done before IPA and could bump alignment based on host
383 backend even for offloaded code which wants different
384 LOCAL_DECL_ALIGNMENT. */
385 if (really_expand)
386 SET_DECL_ALIGN (decl, align);
388 return align / BITS_PER_UNIT;
 391 /* Align the given offset BASE to ALIGN. Round up if ALIGN_UP is true,
 392 round down otherwise. Return the aligned BASE value. */
394 static inline unsigned HOST_WIDE_INT
395 align_base (HOST_WIDE_INT base, unsigned HOST_WIDE_INT align, bool align_up)
397 return align_up ? (base + align - 1) & -align : base & -align;
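/* For example, align_base (13, 8, true) yields 16 and
   align_base (13, 8, false) yields 8.  */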
400 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
401 Return the frame offset. */
403 static poly_int64
404 alloc_stack_frame_space (poly_int64 size, unsigned HOST_WIDE_INT align)
406 poly_int64 offset, new_frame_offset;
408 if (FRAME_GROWS_DOWNWARD)
410 new_frame_offset
411 = aligned_lower_bound (frame_offset - frame_phase - size,
412 align) + frame_phase;
413 offset = new_frame_offset;
415 else
417 new_frame_offset
418 = aligned_upper_bound (frame_offset - frame_phase,
419 align) + frame_phase;
420 offset = new_frame_offset;
421 new_frame_offset += size;
423 frame_offset = new_frame_offset;
425 if (frame_offset_overflow (frame_offset, cfun->decl))
426 frame_offset = offset = 0;
428 return offset;
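/* Illustrative example (assuming frame_phase == 0): with FRAME_GROWS_DOWNWARD,
   a current frame_offset of -16 and a request for 8 bytes at alignment 8 moves
   frame_offset to -24 and returns -24; on an upward-growing frame the aligned
   old offset is returned and frame_offset advances past the new block.  */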
431 /* Accumulate DECL into STACK_VARS. */
433 static void
434 add_stack_var (tree decl, bool really_expand)
436 class stack_var *v;
438 if (stack_vars_num >= stack_vars_alloc)
440 if (stack_vars_alloc)
441 stack_vars_alloc = stack_vars_alloc * 3 / 2;
442 else
443 stack_vars_alloc = 32;
444 stack_vars
445 = XRESIZEVEC (class stack_var, stack_vars, stack_vars_alloc);
447 if (!decl_to_stack_part)
448 decl_to_stack_part = new hash_map<tree, size_t>;
450 v = &stack_vars[stack_vars_num];
451 decl_to_stack_part->put (decl, stack_vars_num);
453 v->decl = decl;
454 tree size = TREE_CODE (decl) == SSA_NAME
455 ? TYPE_SIZE_UNIT (TREE_TYPE (decl))
456 : DECL_SIZE_UNIT (decl);
457 v->size = tree_to_poly_uint64 (size);
458 /* Ensure that all variables have size, so that &a != &b for any two
459 variables that are simultaneously live. */
460 if (known_eq (v->size, 0U))
461 v->size = 1;
462 v->alignb = align_local_variable (decl, really_expand);
463 /* An alignment of zero can mightily confuse us later. */
464 gcc_assert (v->alignb != 0);
466 /* All variables are initially in their own partition. */
467 v->representative = stack_vars_num;
468 v->next = EOC;
470 /* All variables initially conflict with no other. */
471 v->conflicts = NULL;
473 /* Ensure that this decl doesn't get put onto the list twice. */
474 set_rtl (decl, pc_rtx);
476 stack_vars_num++;
 479 /* Make the decls associated with luids X and Y conflict. */
481 static void
482 add_stack_var_conflict (size_t x, size_t y)
484 class stack_var *a = &stack_vars[x];
485 class stack_var *b = &stack_vars[y];
486 if (x == y)
487 return;
488 if (!a->conflicts)
489 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
490 if (!b->conflicts)
491 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
492 bitmap_set_bit (a->conflicts, y);
493 bitmap_set_bit (b->conflicts, x);
 496 /* Check whether the decls associated with luids X and Y conflict. */
498 static bool
499 stack_var_conflict_p (size_t x, size_t y)
501 class stack_var *a = &stack_vars[x];
502 class stack_var *b = &stack_vars[y];
503 if (x == y)
504 return false;
505 /* Partitions containing an SSA name result from gimple registers
506 with things like unsupported modes. They are top-level and
507 hence conflict with everything else. */
508 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
509 return true;
511 if (!a->conflicts || !b->conflicts)
512 return false;
513 return bitmap_bit_p (a->conflicts, y);
516 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
517 enter its partition number into bitmap DATA. */
519 static bool
520 visit_op (gimple *, tree op, tree, void *data)
522 bitmap active = (bitmap)data;
523 op = get_base_address (op);
524 if (op
525 && DECL_P (op)
526 && DECL_RTL_IF_SET (op) == pc_rtx)
528 size_t *v = decl_to_stack_part->get (op);
529 if (v)
530 bitmap_set_bit (active, *v);
532 return false;
535 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
536 record conflicts between it and all currently active other partitions
537 from bitmap DATA. */
539 static bool
540 visit_conflict (gimple *, tree op, tree, void *data)
542 bitmap active = (bitmap)data;
543 op = get_base_address (op);
544 if (op
545 && DECL_P (op)
546 && DECL_RTL_IF_SET (op) == pc_rtx)
548 size_t *v = decl_to_stack_part->get (op);
549 if (v && bitmap_set_bit (active, *v))
551 size_t num = *v;
552 bitmap_iterator bi;
553 unsigned i;
554 gcc_assert (num < stack_vars_num);
555 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
556 add_stack_var_conflict (num, i);
559 return false;
562 /* Helper routine for add_scope_conflicts, calculating the active partitions
563 at the end of BB, leaving the result in WORK. We're called to generate
564 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
565 liveness. */
567 static void
568 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
570 edge e;
571 edge_iterator ei;
572 gimple_stmt_iterator gsi;
573 walk_stmt_load_store_addr_fn visit;
575 bitmap_clear (work);
576 FOR_EACH_EDGE (e, ei, bb->preds)
577 bitmap_ior_into (work, (bitmap)e->src->aux);
579 visit = visit_op;
581 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
583 gimple *stmt = gsi_stmt (gsi);
584 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
586 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
588 gimple *stmt = gsi_stmt (gsi);
590 if (gimple_clobber_p (stmt))
592 tree lhs = gimple_assign_lhs (stmt);
593 size_t *v;
594 /* Nested function lowering might introduce LHSs
595 that are COMPONENT_REFs. */
596 if (!VAR_P (lhs))
597 continue;
598 if (DECL_RTL_IF_SET (lhs) == pc_rtx
599 && (v = decl_to_stack_part->get (lhs)))
600 bitmap_clear_bit (work, *v);
602 else if (!is_gimple_debug (stmt))
604 if (for_conflict
605 && visit == visit_op)
607 /* If this is the first real instruction in this BB we need
608 to add conflicts for everything live at this point now.
609 Unlike classical liveness for named objects we can't
610 rely on seeing a def/use of the names we're interested in.
 611 There might merely be indirect loads/stores. We would otherwise not add any
612 conflicts for such partitions. */
613 bitmap_iterator bi;
614 unsigned i;
615 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
617 class stack_var *a = &stack_vars[i];
618 if (!a->conflicts)
619 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
620 bitmap_ior_into (a->conflicts, work);
622 visit = visit_conflict;
624 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
629 /* Generate stack partition conflicts between all partitions that are
630 simultaneously live. */
632 static void
633 add_scope_conflicts (void)
635 basic_block bb;
636 bool changed;
637 bitmap work = BITMAP_ALLOC (NULL);
638 int *rpo;
639 int n_bbs;
641 /* We approximate the live range of a stack variable by taking the first
642 mention of its name as starting point(s), and by the end-of-scope
643 death clobber added by gimplify as ending point(s) of the range.
 644 This overapproximates in the case where we, for instance, moved an address-taken
 645 operation upward without also moving a dereference to it upward.
 646 But it's conservatively correct, as a variable can never hold values
 647 before its name is mentioned at least once.
649 We then do a mostly classical bitmap liveness algorithm. */
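     As a concrete example (illustrative only): for
	{ char buf[64]; use (&buf); } ... { char buf2[64]; use (&buf2); }
     the gimplifier emits a clobber for buf at the end of its scope, so buf
     and buf2 are never simultaneously live here, their partitions need no
     conflict, and they can share one stack slot.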
651 FOR_ALL_BB_FN (bb, cfun)
652 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
654 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
655 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
657 changed = true;
658 while (changed)
660 int i;
661 changed = false;
662 for (i = 0; i < n_bbs; i++)
664 bitmap active;
665 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
666 active = (bitmap)bb->aux;
667 add_scope_conflicts_1 (bb, work, false);
668 if (bitmap_ior_into (active, work))
669 changed = true;
673 FOR_EACH_BB_FN (bb, cfun)
674 add_scope_conflicts_1 (bb, work, true);
676 free (rpo);
677 BITMAP_FREE (work);
678 FOR_ALL_BB_FN (bb, cfun)
679 BITMAP_FREE (bb->aux);
682 /* A subroutine of partition_stack_vars. A comparison function for qsort,
683 sorting an array of indices by the properties of the object. */
685 static int
686 stack_var_cmp (const void *a, const void *b)
688 size_t ia = *(const size_t *)a;
689 size_t ib = *(const size_t *)b;
690 unsigned int aligna = stack_vars[ia].alignb;
691 unsigned int alignb = stack_vars[ib].alignb;
692 poly_int64 sizea = stack_vars[ia].size;
693 poly_int64 sizeb = stack_vars[ib].size;
694 tree decla = stack_vars[ia].decl;
695 tree declb = stack_vars[ib].decl;
696 bool largea, largeb;
697 unsigned int uida, uidb;
699 /* Primary compare on "large" alignment. Large comes first. */
700 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
701 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
702 if (largea != largeb)
703 return (int)largeb - (int)largea;
 705 /* Secondary compare on size, decreasing. */
706 int diff = compare_sizes_for_sort (sizeb, sizea);
707 if (diff != 0)
708 return diff;
710 /* Tertiary compare on true alignment, decreasing. */
711 if (aligna < alignb)
712 return -1;
713 if (aligna > alignb)
714 return 1;
716 /* Final compare on ID for sort stability, increasing.
717 Two SSA names are compared by their version, SSA names come before
718 non-SSA names, and two normal decls are compared by their DECL_UID. */
719 if (TREE_CODE (decla) == SSA_NAME)
721 if (TREE_CODE (declb) == SSA_NAME)
722 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
723 else
724 return -1;
726 else if (TREE_CODE (declb) == SSA_NAME)
727 return 1;
728 else
729 uida = DECL_UID (decla), uidb = DECL_UID (declb);
730 if (uida < uidb)
731 return 1;
732 if (uida > uidb)
733 return -1;
734 return 0;
737 struct part_traits : unbounded_int_hashmap_traits <size_t, bitmap> {};
738 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
 740 /* If the points-to solution *PT points to variables that are in a partition
 741 together with other variables, add all partition members to the pointed-to
742 variables bitmap. */
744 static void
745 add_partitioned_vars_to_ptset (struct pt_solution *pt,
746 part_hashmap *decls_to_partitions,
747 hash_set<bitmap> *visited, bitmap temp)
749 bitmap_iterator bi;
750 unsigned i;
751 bitmap *part;
753 if (pt->anything
754 || pt->vars == NULL
755 /* The pointed-to vars bitmap is shared, it is enough to
756 visit it once. */
757 || visited->add (pt->vars))
758 return;
760 bitmap_clear (temp);
762 /* By using a temporary bitmap to store all members of the partitions
763 we have to add we make sure to visit each of the partitions only
764 once. */
765 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
766 if ((!temp
767 || !bitmap_bit_p (temp, i))
768 && (part = decls_to_partitions->get (i)))
769 bitmap_ior_into (temp, *part);
770 if (!bitmap_empty_p (temp))
771 bitmap_ior_into (pt->vars, temp);
774 /* Update points-to sets based on partition info, so we can use them on RTL.
775 The bitmaps representing stack partitions will be saved until expand,
776 where partitioned decls used as bases in memory expressions will be
777 rewritten. */
779 static void
780 update_alias_info_with_stack_vars (void)
782 part_hashmap *decls_to_partitions = NULL;
783 size_t i, j;
784 tree var = NULL_TREE;
786 for (i = 0; i < stack_vars_num; i++)
788 bitmap part = NULL;
789 tree name;
790 struct ptr_info_def *pi;
 792 /* Not interested in partitions with a single variable. */
793 if (stack_vars[i].representative != i
794 || stack_vars[i].next == EOC)
795 continue;
797 if (!decls_to_partitions)
799 decls_to_partitions = new part_hashmap;
800 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
803 /* Create an SSA_NAME that points to the partition for use
804 as base during alias-oracle queries on RTL for bases that
805 have been partitioned. */
806 if (var == NULL_TREE)
807 var = create_tmp_var (ptr_type_node);
808 name = make_ssa_name (var);
810 /* Create bitmaps representing partitions. They will be used for
811 points-to sets later, so use GGC alloc. */
812 part = BITMAP_GGC_ALLOC ();
813 for (j = i; j != EOC; j = stack_vars[j].next)
815 tree decl = stack_vars[j].decl;
816 unsigned int uid = DECL_PT_UID (decl);
817 bitmap_set_bit (part, uid);
818 decls_to_partitions->put (uid, part);
819 cfun->gimple_df->decls_to_pointers->put (decl, name);
820 if (TREE_ADDRESSABLE (decl))
821 TREE_ADDRESSABLE (name) = 1;
824 /* Make the SSA name point to all partition members. */
825 pi = get_ptr_info (name);
826 pt_solution_set (&pi->pt, part, false);
829 /* Make all points-to sets that contain one member of a partition
830 contain all members of the partition. */
831 if (decls_to_partitions)
833 unsigned i;
834 tree name;
835 hash_set<bitmap> visited;
836 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
838 FOR_EACH_SSA_NAME (i, name, cfun)
840 struct ptr_info_def *pi;
842 if (POINTER_TYPE_P (TREE_TYPE (name))
843 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
844 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
845 &visited, temp);
848 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
849 decls_to_partitions, &visited, temp);
851 delete decls_to_partitions;
852 BITMAP_FREE (temp);
856 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
857 partitioning algorithm. Partitions A and B are known to be non-conflicting.
858 Merge them into a single partition A. */
860 static void
861 union_stack_vars (size_t a, size_t b)
863 class stack_var *vb = &stack_vars[b];
864 bitmap_iterator bi;
865 unsigned u;
867 gcc_assert (stack_vars[b].next == EOC);
868 /* Add B to A's partition. */
869 stack_vars[b].next = stack_vars[a].next;
870 stack_vars[b].representative = a;
871 stack_vars[a].next = b;
873 /* Make sure A is big enough to hold B. */
874 stack_vars[a].size = upper_bound (stack_vars[a].size, stack_vars[b].size);
876 /* Update the required alignment of partition A to account for B. */
877 if (stack_vars[a].alignb < stack_vars[b].alignb)
878 stack_vars[a].alignb = stack_vars[b].alignb;
880 /* Update the interference graph and merge the conflicts. */
881 if (vb->conflicts)
883 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
884 add_stack_var_conflict (a, stack_vars[u].representative);
885 BITMAP_FREE (vb->conflicts);
889 /* A subroutine of expand_used_vars. Binpack the variables into
890 partitions constrained by the interference graph. The overall
891 algorithm used is as follows:
893 Sort the objects by size in descending order.
894 For each object A {
895 S = size(A)
896 O = 0
897 loop {
898 Look for the largest non-conflicting object B with size <= S.
899 UNION (A, B)
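     For instance (illustrative sizes), three pairwise non-conflicting
     objects of 32, 24 and 8 bytes end up in a single partition whose
     representative keeps the maximum size, 32 bytes, so all three share
     one 32-byte slot.  */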
904 static void
905 partition_stack_vars (void)
907 size_t si, sj, n = stack_vars_num;
909 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
910 for (si = 0; si < n; ++si)
911 stack_vars_sorted[si] = si;
913 if (n == 1)
914 return;
916 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
918 for (si = 0; si < n; ++si)
920 size_t i = stack_vars_sorted[si];
921 unsigned int ialign = stack_vars[i].alignb;
922 poly_int64 isize = stack_vars[i].size;
924 /* Ignore objects that aren't partition representatives. If we
925 see a var that is not a partition representative, it must
926 have been merged earlier. */
927 if (stack_vars[i].representative != i)
928 continue;
930 for (sj = si + 1; sj < n; ++sj)
932 size_t j = stack_vars_sorted[sj];
933 unsigned int jalign = stack_vars[j].alignb;
934 poly_int64 jsize = stack_vars[j].size;
936 /* Ignore objects that aren't partition representatives. */
937 if (stack_vars[j].representative != j)
938 continue;
940 /* Do not mix objects of "small" (supported) alignment
941 and "large" (unsupported) alignment. */
942 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
943 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
944 break;
946 /* For Address Sanitizer do not mix objects with different
947 sizes, as the shorter vars wouldn't be adequately protected.
948 Don't do that for "large" (unsupported) alignment objects,
949 those aren't protected anyway. */
950 if (asan_sanitize_stack_p ()
951 && maybe_ne (isize, jsize)
952 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
953 break;
955 /* Ignore conflicting objects. */
956 if (stack_var_conflict_p (i, j))
957 continue;
959 /* UNION the objects, placing J at OFFSET. */
960 union_stack_vars (i, j);
964 update_alias_info_with_stack_vars ();
967 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
969 static void
970 dump_stack_var_partition (void)
972 size_t si, i, j, n = stack_vars_num;
974 for (si = 0; si < n; ++si)
976 i = stack_vars_sorted[si];
978 /* Skip variables that aren't partition representatives, for now. */
979 if (stack_vars[i].representative != i)
980 continue;
982 fprintf (dump_file, "Partition %lu: size ", (unsigned long) i);
983 print_dec (stack_vars[i].size, dump_file);
984 fprintf (dump_file, " align %u\n", stack_vars[i].alignb);
986 for (j = i; j != EOC; j = stack_vars[j].next)
988 fputc ('\t', dump_file);
989 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
991 fputc ('\n', dump_file);
995 /* Assign rtl to DECL at BASE + OFFSET. */
997 static void
998 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
999 poly_int64 offset)
1001 unsigned align;
1002 rtx x;
1004 /* If this fails, we've overflowed the stack frame. Error nicely? */
1005 gcc_assert (known_eq (offset, trunc_int_for_mode (offset, Pmode)));
1007 x = plus_constant (Pmode, base, offset);
1008 x = gen_rtx_MEM (TREE_CODE (decl) == SSA_NAME
1009 ? TYPE_MODE (TREE_TYPE (decl))
1010 : DECL_MODE (decl), x);
 1012 /* Set the alignment we actually gave this decl if it isn't an SSA name.
 1013 If it is, we generate stack slots only accidentally, so it isn't as
 1014 important; we'll simply set the alignment directly on the MEM. */
1016 if (base == virtual_stack_vars_rtx)
1017 offset -= frame_phase;
1018 align = known_alignment (offset);
1019 align *= BITS_PER_UNIT;
1020 if (align == 0 || align > base_align)
1021 align = base_align;
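  /* For example (illustrative numbers), an offset of -24 bytes from
     virtual_stack_vars_rtx with frame_phase 0 has a known alignment of
     8 bytes, i.e. 64 bits, which is then capped by BASE_ALIGN above.  */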
1023 if (TREE_CODE (decl) != SSA_NAME)
1025 /* One would think that we could assert that we're not decreasing
1026 alignment here, but (at least) the i386 port does exactly this
1027 via the MINIMUM_ALIGNMENT hook. */
1029 SET_DECL_ALIGN (decl, align);
1030 DECL_USER_ALIGN (decl) = 0;
1033 set_rtl (decl, x);
1035 set_mem_align (x, align);
1038 class stack_vars_data
1040 public:
1041 /* Vector of offset pairs, always end of some padding followed
1042 by start of the padding that needs Address Sanitizer protection.
 1043 The vector is in reversed order; highest-offset pairs come first. */
1044 auto_vec<HOST_WIDE_INT> asan_vec;
1046 /* Vector of partition representative decls in between the paddings. */
1047 auto_vec<tree> asan_decl_vec;
1049 /* Base pseudo register for Address Sanitizer protected automatic vars. */
1050 rtx asan_base;
1052 /* Alignment needed for the Address Sanitizer protected automatic vars. */
1053 unsigned int asan_alignb;
1056 /* A subroutine of expand_used_vars. Give each partition representative
1057 a unique location within the stack frame. Update each partition member
1058 with that location. */
1060 static void
1061 expand_stack_vars (bool (*pred) (size_t), class stack_vars_data *data)
1063 size_t si, i, j, n = stack_vars_num;
1064 poly_uint64 large_size = 0, large_alloc = 0;
1065 rtx large_base = NULL;
1066 unsigned large_align = 0;
1067 bool large_allocation_done = false;
1068 tree decl;
1070 /* Determine if there are any variables requiring "large" alignment.
 1071 Since these are dynamically allocated, we only process them when
 1072 no predicate is involved. */
1073 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
1074 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
1076 /* Find the total size of these variables. */
1077 for (si = 0; si < n; ++si)
1079 unsigned alignb;
1081 i = stack_vars_sorted[si];
1082 alignb = stack_vars[i].alignb;
1084 /* All "large" alignment decls come before all "small" alignment
1085 decls, but "large" alignment decls are not sorted based on
1086 their alignment. Increase large_align to track the largest
1087 required alignment. */
1088 if ((alignb * BITS_PER_UNIT) > large_align)
1089 large_align = alignb * BITS_PER_UNIT;
1091 /* Stop when we get to the first decl with "small" alignment. */
1092 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1093 break;
1095 /* Skip variables that aren't partition representatives. */
1096 if (stack_vars[i].representative != i)
1097 continue;
1099 /* Skip variables that have already had rtl assigned. See also
1100 add_stack_var where we perpetrate this pc_rtx hack. */
1101 decl = stack_vars[i].decl;
1102 if (TREE_CODE (decl) == SSA_NAME
1103 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1104 : DECL_RTL (decl) != pc_rtx)
1105 continue;
1107 large_size = aligned_upper_bound (large_size, alignb);
1108 large_size += stack_vars[i].size;
1112 for (si = 0; si < n; ++si)
1114 rtx base;
1115 unsigned base_align, alignb;
1116 poly_int64 offset;
1118 i = stack_vars_sorted[si];
1120 /* Skip variables that aren't partition representatives, for now. */
1121 if (stack_vars[i].representative != i)
1122 continue;
1124 /* Skip variables that have already had rtl assigned. See also
1125 add_stack_var where we perpetrate this pc_rtx hack. */
1126 decl = stack_vars[i].decl;
1127 if (TREE_CODE (decl) == SSA_NAME
1128 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)] != NULL_RTX
1129 : DECL_RTL (decl) != pc_rtx)
1130 continue;
1132 /* Check the predicate to see whether this variable should be
1133 allocated in this pass. */
1134 if (pred && !pred (i))
1135 continue;
1137 alignb = stack_vars[i].alignb;
1138 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
1140 base = virtual_stack_vars_rtx;
1141 /* ASAN description strings don't yet have a syntax for expressing
1142 polynomial offsets. */
1143 HOST_WIDE_INT prev_offset;
1144 if (asan_sanitize_stack_p ()
1145 && pred
1146 && frame_offset.is_constant (&prev_offset)
1147 && stack_vars[i].size.is_constant ())
1149 if (data->asan_vec.is_empty ())
1151 alloc_stack_frame_space (0, ASAN_RED_ZONE_SIZE);
1152 prev_offset = frame_offset.to_constant ();
1154 prev_offset = align_base (prev_offset,
1155 ASAN_MIN_RED_ZONE_SIZE,
1156 !FRAME_GROWS_DOWNWARD);
1157 tree repr_decl = NULL_TREE;
1158 unsigned HOST_WIDE_INT size
1159 = asan_var_and_redzone_size (stack_vars[i].size.to_constant ());
1160 if (data->asan_vec.is_empty ())
1161 size = MAX (size, ASAN_RED_ZONE_SIZE);
1163 unsigned HOST_WIDE_INT alignment = MAX (alignb,
1164 ASAN_MIN_RED_ZONE_SIZE);
1165 offset = alloc_stack_frame_space (size, alignment);
1167 data->asan_vec.safe_push (prev_offset);
1168 /* Allocating a constant amount of space from a constant
1169 starting offset must give a constant result. */
1170 data->asan_vec.safe_push ((offset + stack_vars[i].size)
1171 .to_constant ());
1172 /* Find best representative of the partition.
 1173 Prefer those with DECL_NAME, and even better those
 1174 satisfying the asan_protect_stack_decl predicate. */
1175 for (j = i; j != EOC; j = stack_vars[j].next)
1176 if (asan_protect_stack_decl (stack_vars[j].decl)
1177 && DECL_NAME (stack_vars[j].decl))
1179 repr_decl = stack_vars[j].decl;
1180 break;
1182 else if (repr_decl == NULL_TREE
1183 && DECL_P (stack_vars[j].decl)
1184 && DECL_NAME (stack_vars[j].decl))
1185 repr_decl = stack_vars[j].decl;
1186 if (repr_decl == NULL_TREE)
1187 repr_decl = stack_vars[i].decl;
1188 data->asan_decl_vec.safe_push (repr_decl);
 1190 /* Make sure a representative is unpoisoned if another
1191 variable in the partition is handled by
1192 use-after-scope sanitization. */
1193 if (asan_handled_variables != NULL
1194 && !asan_handled_variables->contains (repr_decl))
1196 for (j = i; j != EOC; j = stack_vars[j].next)
1197 if (asan_handled_variables->contains (stack_vars[j].decl))
1198 break;
1199 if (j != EOC)
1200 asan_handled_variables->add (repr_decl);
1203 data->asan_alignb = MAX (data->asan_alignb, alignb);
1204 if (data->asan_base == NULL)
1205 data->asan_base = gen_reg_rtx (Pmode);
1206 base = data->asan_base;
1208 if (!STRICT_ALIGNMENT)
1209 base_align = crtl->max_used_stack_slot_alignment;
1210 else
1211 base_align = MAX (crtl->max_used_stack_slot_alignment,
1212 GET_MODE_ALIGNMENT (SImode)
1213 << ASAN_SHADOW_SHIFT);
1215 else
1217 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1218 base_align = crtl->max_used_stack_slot_alignment;
1221 else
1223 /* Large alignment is only processed in the last pass. */
1224 if (pred)
1225 continue;
1227 /* If there were any variables requiring "large" alignment, allocate
1228 space. */
1229 if (maybe_ne (large_size, 0U) && ! large_allocation_done)
1231 poly_int64 loffset;
1232 rtx large_allocsize;
1234 large_allocsize = gen_int_mode (large_size, Pmode);
1235 get_dynamic_stack_size (&large_allocsize, 0, large_align, NULL);
1236 loffset = alloc_stack_frame_space
1237 (rtx_to_poly_int64 (large_allocsize),
1238 PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT);
1239 large_base = get_dynamic_stack_base (loffset, large_align);
1240 large_allocation_done = true;
1242 gcc_assert (large_base != NULL);
1244 large_alloc = aligned_upper_bound (large_alloc, alignb);
1245 offset = large_alloc;
1246 large_alloc += stack_vars[i].size;
1248 base = large_base;
1249 base_align = large_align;
1252 /* Create rtl for each variable based on their location within the
1253 partition. */
1254 for (j = i; j != EOC; j = stack_vars[j].next)
1256 expand_one_stack_var_at (stack_vars[j].decl,
1257 base, base_align,
1258 offset);
1262 gcc_assert (known_eq (large_alloc, large_size));
1265 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1266 static poly_uint64
1267 account_stack_vars (void)
1269 size_t si, j, i, n = stack_vars_num;
1270 poly_uint64 size = 0;
1272 for (si = 0; si < n; ++si)
1274 i = stack_vars_sorted[si];
1276 /* Skip variables that aren't partition representatives, for now. */
1277 if (stack_vars[i].representative != i)
1278 continue;
1280 size += stack_vars[i].size;
1281 for (j = i; j != EOC; j = stack_vars[j].next)
1282 set_rtl (stack_vars[j].decl, NULL);
1284 return size;
1287 /* Record the RTL assignment X for the default def of PARM. */
1289 extern void
1290 set_parm_rtl (tree parm, rtx x)
1292 gcc_assert (TREE_CODE (parm) == PARM_DECL
1293 || TREE_CODE (parm) == RESULT_DECL);
1295 if (x && !MEM_P (x))
1297 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (parm),
1298 TYPE_MODE (TREE_TYPE (parm)),
1299 TYPE_ALIGN (TREE_TYPE (parm)));
 1301 /* If the variable alignment is very large we'll dynamically
1302 allocate it, which means that in-frame portion is just a
1303 pointer. ??? We've got a pseudo for sure here, do we
1304 actually dynamically allocate its spilling area if needed?
1305 ??? Isn't it a problem when Pmode alignment also exceeds
1306 MAX_SUPPORTED_STACK_ALIGNMENT, as can happen on cris and lm32? */
1307 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1308 align = GET_MODE_ALIGNMENT (Pmode);
1310 record_alignment_for_reg_var (align);
1313 tree ssa = ssa_default_def (cfun, parm);
1314 if (!ssa)
1315 return set_rtl (parm, x);
1317 int part = var_to_partition (SA.map, ssa);
1318 gcc_assert (part != NO_PARTITION);
1320 bool changed = bitmap_bit_p (SA.partitions_for_parm_default_defs, part);
1321 gcc_assert (changed);
1323 set_rtl (ssa, x);
1324 gcc_assert (DECL_RTL (parm) == x);
1327 /* A subroutine of expand_one_var. Called to immediately assign rtl
1328 to a variable to be allocated in the stack frame. */
1330 static void
1331 expand_one_stack_var_1 (tree var)
1333 poly_uint64 size;
1334 poly_int64 offset;
1335 unsigned byte_align;
1337 if (TREE_CODE (var) == SSA_NAME)
1339 tree type = TREE_TYPE (var);
1340 size = tree_to_poly_uint64 (TYPE_SIZE_UNIT (type));
1342 else
1343 size = tree_to_poly_uint64 (DECL_SIZE_UNIT (var));
1345 byte_align = align_local_variable (var, true);
1347 /* We handle highly aligned variables in expand_stack_vars. */
1348 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1350 offset = alloc_stack_frame_space (size, byte_align);
1352 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1353 crtl->max_used_stack_slot_alignment, offset);
1356 /* Wrapper for expand_one_stack_var_1 that checks SSA_NAMEs are
1357 already assigned some MEM. */
1359 static void
1360 expand_one_stack_var (tree var)
1362 if (TREE_CODE (var) == SSA_NAME)
1364 int part = var_to_partition (SA.map, var);
1365 if (part != NO_PARTITION)
1367 rtx x = SA.partition_to_pseudo[part];
1368 gcc_assert (x);
1369 gcc_assert (MEM_P (x));
1370 return;
1374 return expand_one_stack_var_1 (var);
1377 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1378 that will reside in a hard register. */
1380 static void
1381 expand_one_hard_reg_var (tree var)
1383 rest_of_decl_compilation (var, 0, 0);
1386 /* Record the alignment requirements of some variable assigned to a
1387 pseudo. */
1389 static void
1390 record_alignment_for_reg_var (unsigned int align)
1392 if (SUPPORTS_STACK_ALIGNMENT
1393 && crtl->stack_alignment_estimated < align)
1395 /* stack_alignment_estimated shouldn't change after stack
 1396 realign decision has been made. */
1397 gcc_assert (!crtl->stack_realign_processed);
1398 crtl->stack_alignment_estimated = align;
1401 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1402 So here we only make sure stack_alignment_needed >= align. */
1403 if (crtl->stack_alignment_needed < align)
1404 crtl->stack_alignment_needed = align;
1405 if (crtl->max_used_stack_slot_alignment < align)
1406 crtl->max_used_stack_slot_alignment = align;
1409 /* Create RTL for an SSA partition. */
1411 static void
1412 expand_one_ssa_partition (tree var)
1414 int part = var_to_partition (SA.map, var);
1415 gcc_assert (part != NO_PARTITION);
1417 if (SA.partition_to_pseudo[part])
1418 return;
1420 unsigned int align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1421 TYPE_MODE (TREE_TYPE (var)),
1422 TYPE_ALIGN (TREE_TYPE (var)));
 1424 /* If the variable alignment is very large we'll dynamically allocate
1425 it, which means that in-frame portion is just a pointer. */
1426 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1427 align = GET_MODE_ALIGNMENT (Pmode);
1429 record_alignment_for_reg_var (align);
1431 if (!use_register_for_decl (var))
1433 if (defer_stack_allocation (var, true))
1434 add_stack_var (var, true);
1435 else
1436 expand_one_stack_var_1 (var);
1437 return;
1440 machine_mode reg_mode = promote_ssa_mode (var, NULL);
1441 rtx x = gen_reg_rtx (reg_mode);
1443 set_rtl (var, x);
1445 /* For a promoted variable, X will not be used directly but wrapped in a
1446 SUBREG with SUBREG_PROMOTED_VAR_P set, which means that the RTL land
1447 will assume that its upper bits can be inferred from its lower bits.
1448 Therefore, if X isn't initialized on every path from the entry, then
1449 we must do it manually in order to fulfill the above assumption. */
1450 if (reg_mode != TYPE_MODE (TREE_TYPE (var))
1451 && bitmap_bit_p (SA.partitions_for_undefined_values, part))
1452 emit_move_insn (x, CONST0_RTX (reg_mode));
1455 /* Record the association between the RTL generated for partition PART
1456 and the underlying variable of the SSA_NAME VAR. */
1458 static void
1459 adjust_one_expanded_partition_var (tree var)
1461 if (!var)
1462 return;
1464 tree decl = SSA_NAME_VAR (var);
1466 int part = var_to_partition (SA.map, var);
1467 if (part == NO_PARTITION)
1468 return;
1470 rtx x = SA.partition_to_pseudo[part];
1472 gcc_assert (x);
1474 set_rtl (var, x);
1476 if (!REG_P (x))
1477 return;
1479 /* Note if the object is a user variable. */
1480 if (decl && !DECL_ARTIFICIAL (decl))
1481 mark_user_reg (x);
1483 if (POINTER_TYPE_P (decl ? TREE_TYPE (decl) : TREE_TYPE (var)))
1484 mark_reg_pointer (x, get_pointer_alignment (var));
1487 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1488 that will reside in a pseudo register. */
1490 static void
1491 expand_one_register_var (tree var)
1493 if (TREE_CODE (var) == SSA_NAME)
1495 int part = var_to_partition (SA.map, var);
1496 if (part != NO_PARTITION)
1498 rtx x = SA.partition_to_pseudo[part];
1499 gcc_assert (x);
1500 gcc_assert (REG_P (x));
1501 return;
1503 gcc_unreachable ();
1506 tree decl = var;
1507 tree type = TREE_TYPE (decl);
1508 machine_mode reg_mode = promote_decl_mode (decl, NULL);
1509 rtx x = gen_reg_rtx (reg_mode);
1511 set_rtl (var, x);
1513 /* Note if the object is a user variable. */
1514 if (!DECL_ARTIFICIAL (decl))
1515 mark_user_reg (x);
1517 if (POINTER_TYPE_P (type))
1518 mark_reg_pointer (x, get_pointer_alignment (var));
1521 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1522 has some associated error, e.g. its type is error-mark. We just need
1523 to pick something that won't crash the rest of the compiler. */
1525 static void
1526 expand_one_error_var (tree var)
1528 machine_mode mode = DECL_MODE (var);
1529 rtx x;
1531 if (mode == BLKmode)
1532 x = gen_rtx_MEM (BLKmode, const0_rtx);
1533 else if (mode == VOIDmode)
1534 x = const0_rtx;
1535 else
1536 x = gen_reg_rtx (mode);
1538 SET_DECL_RTL (var, x);
1541 /* A subroutine of expand_one_var. VAR is a variable that will be
1542 allocated to the local stack frame. Return true if we wish to
1543 add VAR to STACK_VARS so that it will be coalesced with other
1544 variables. Return false to allocate VAR immediately.
1546 This function is used to reduce the number of variables considered
1547 for coalescing, which reduces the size of the quadratic problem. */
1549 static bool
1550 defer_stack_allocation (tree var, bool toplevel)
1552 tree size_unit = TREE_CODE (var) == SSA_NAME
1553 ? TYPE_SIZE_UNIT (TREE_TYPE (var))
1554 : DECL_SIZE_UNIT (var);
1555 poly_uint64 size;
1557 /* Whether the variable is small enough for immediate allocation not to be
1558 a problem with regard to the frame size. */
1559 bool smallish
1560 = (poly_int_tree_p (size_unit, &size)
1561 && (estimated_poly_value (size)
1562 < param_min_size_for_stack_sharing));
1564 /* If stack protection is enabled, *all* stack variables must be deferred,
1565 so that we can re-order the strings to the top of the frame.
1566 Similarly for Address Sanitizer. */
1567 if (flag_stack_protect || asan_sanitize_stack_p ())
1568 return true;
1570 unsigned int align = TREE_CODE (var) == SSA_NAME
1571 ? TYPE_ALIGN (TREE_TYPE (var))
1572 : DECL_ALIGN (var);
1574 /* We handle "large" alignment via dynamic allocation. We want to handle
1575 this extra complication in only one place, so defer them. */
1576 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1577 return true;
1579 bool ignored = TREE_CODE (var) == SSA_NAME
1580 ? !SSAVAR (var) || DECL_IGNORED_P (SSA_NAME_VAR (var))
1581 : DECL_IGNORED_P (var);
1583 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1584 might be detached from their block and appear at toplevel when we reach
1585 here. We want to coalesce them with variables from other blocks when
1586 the immediate contribution to the frame size would be noticeable. */
1587 if (toplevel && optimize > 0 && ignored && !smallish)
1588 return true;
1590 /* Variables declared in the outermost scope automatically conflict
1591 with every other variable. The only reason to want to defer them
1592 at all is that, after sorting, we can more efficiently pack
1593 small variables in the stack frame. Continue to defer at -O2. */
1594 if (toplevel && optimize < 2)
1595 return false;
1597 /* Without optimization, *most* variables are allocated from the
1598 stack, which makes the quadratic problem large exactly when we
1599 want compilation to proceed as quickly as possible. On the
1600 other hand, we don't want the function's stack frame size to
1601 get completely out of hand. So we avoid adding scalars and
1602 "small" aggregates to the list at all. */
1603 if (optimize == 0 && smallish)
1604 return false;
1606 return true;
1609 /* A subroutine of expand_used_vars. Expand one variable according to
1610 its flavor. Variables to be placed on the stack are not actually
1611 expanded yet, merely recorded.
1612 When REALLY_EXPAND is false, only add stack values to be allocated.
 1613 Return the stack usage this variable is supposed to take.
1616 static poly_uint64
1617 expand_one_var (tree var, bool toplevel, bool really_expand)
1619 unsigned int align = BITS_PER_UNIT;
1620 tree origvar = var;
1622 var = SSAVAR (var);
1624 if (TREE_TYPE (var) != error_mark_node && VAR_P (var))
1626 if (is_global_var (var))
1627 return 0;
 1629 /* Because we don't know if VAR will be in a register or on the stack,
 1630 we conservatively assume it will be on the stack even if VAR is
 1631 eventually put into a register after the RA pass. For non-automatic
1632 variables, which won't be on stack, we collect alignment of
1633 type and ignore user specified alignment. Similarly for
1634 SSA_NAMEs for which use_register_for_decl returns true. */
1635 if (TREE_STATIC (var)
1636 || DECL_EXTERNAL (var)
1637 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1638 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1639 TYPE_MODE (TREE_TYPE (var)),
1640 TYPE_ALIGN (TREE_TYPE (var)));
1641 else if (DECL_HAS_VALUE_EXPR_P (var)
1642 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1643 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1644 or variables which were assigned a stack slot already by
1645 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1646 changed from the offset chosen to it. */
1647 align = crtl->stack_alignment_estimated;
1648 else
1649 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
 1651 /* If the variable alignment is very large we'll dynamically allocate
1652 it, which means that in-frame portion is just a pointer. */
1653 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1654 align = GET_MODE_ALIGNMENT (Pmode);
1657 record_alignment_for_reg_var (align);
1659 poly_uint64 size;
1660 if (TREE_CODE (origvar) == SSA_NAME)
1662 gcc_assert (!VAR_P (var)
1663 || (!DECL_EXTERNAL (var)
1664 && !DECL_HAS_VALUE_EXPR_P (var)
1665 && !TREE_STATIC (var)
1666 && TREE_TYPE (var) != error_mark_node
1667 && !DECL_HARD_REGISTER (var)
1668 && really_expand));
1670 if (!VAR_P (var) && TREE_CODE (origvar) != SSA_NAME)
1672 else if (DECL_EXTERNAL (var))
1674 else if (DECL_HAS_VALUE_EXPR_P (var))
1676 else if (TREE_STATIC (var))
1678 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1680 else if (TREE_TYPE (var) == error_mark_node)
1682 if (really_expand)
1683 expand_one_error_var (var);
1685 else if (VAR_P (var) && DECL_HARD_REGISTER (var))
1687 if (really_expand)
1689 expand_one_hard_reg_var (var);
1690 if (!DECL_HARD_REGISTER (var))
1691 /* Invalid register specification. */
1692 expand_one_error_var (var);
1695 else if (use_register_for_decl (var))
1697 if (really_expand)
1698 expand_one_register_var (origvar);
1700 else if (!poly_int_tree_p (DECL_SIZE_UNIT (var), &size)
1701 || !valid_constant_size_p (DECL_SIZE_UNIT (var)))
1703 /* Reject variables which cover more than half of the address-space. */
1704 if (really_expand)
1706 if (DECL_NONLOCAL_FRAME (var))
1707 error_at (DECL_SOURCE_LOCATION (current_function_decl),
1708 "total size of local objects is too large");
1709 else
1710 error_at (DECL_SOURCE_LOCATION (var),
1711 "size of variable %q+D is too large", var);
1712 expand_one_error_var (var);
1715 else if (defer_stack_allocation (var, toplevel))
1716 add_stack_var (origvar, really_expand);
1717 else
1719 if (really_expand)
1721 if (lookup_attribute ("naked",
1722 DECL_ATTRIBUTES (current_function_decl)))
1723 error ("cannot allocate stack for variable %q+D, naked function",
1724 var);
1726 expand_one_stack_var (origvar);
1728 return size;
1730 return 0;
1733 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1734 expanding variables. Those variables that can be put into registers
1735 are allocated pseudos; those that can't are put on the stack.
1737 TOPLEVEL is true if this is the outermost BLOCK. */
1739 static void
1740 expand_used_vars_for_block (tree block, bool toplevel)
1742 tree t;
1744 /* Expand all variables at this level. */
1745 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1746 if (TREE_USED (t)
1747 && ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1748 || !DECL_NONSHAREABLE (t)))
1749 expand_one_var (t, toplevel, true);
1751 /* Expand all variables at containing levels. */
1752 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1753 expand_used_vars_for_block (t, false);
1756 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1757 and clear TREE_USED on all local variables. */
1759 static void
1760 clear_tree_used (tree block)
1762 tree t;
1764 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1765 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1766 if ((!VAR_P (t) && TREE_CODE (t) != RESULT_DECL)
1767 || !DECL_NONSHAREABLE (t))
1768 TREE_USED (t) = 0;
1770 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1771 clear_tree_used (t);
1774 /* Examine TYPE and determine a bit mask of the following features. */
1776 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1777 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1778 #define SPCT_HAS_ARRAY 4
1779 #define SPCT_HAS_AGGREGATE 8
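/* For instance, with the default --param=ssp-buffer-size of 8 (assumed
   here for illustration), a local 'char buf[4]' classifies as
   SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY, while 'char buf[64]'
   classifies as SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY.  */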
1781 static unsigned int
1782 stack_protect_classify_type (tree type)
1784 unsigned int ret = 0;
1785 tree t;
1787 switch (TREE_CODE (type))
1789 case ARRAY_TYPE:
1790 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1791 if (t == char_type_node
1792 || t == signed_char_type_node
1793 || t == unsigned_char_type_node)
1795 unsigned HOST_WIDE_INT max = param_ssp_buffer_size;
1796 unsigned HOST_WIDE_INT len;
1798 if (!TYPE_SIZE_UNIT (type)
1799 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1800 len = max;
1801 else
1802 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1804 if (len < max)
1805 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1806 else
1807 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1809 else
1810 ret = SPCT_HAS_ARRAY;
1811 break;
1813 case UNION_TYPE:
1814 case QUAL_UNION_TYPE:
1815 case RECORD_TYPE:
1816 ret = SPCT_HAS_AGGREGATE;
1817 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1818 if (TREE_CODE (t) == FIELD_DECL)
1819 ret |= stack_protect_classify_type (TREE_TYPE (t));
1820 break;
1822 default:
1823 break;
1826 return ret;
1829 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1830 part of the local stack frame. Remember if we ever return nonzero for
1831 any variable in this function. The return value is the phase number in
1832 which the variable should be allocated. */
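/* For example, under -fstack-protector-strong a bare character buffer is
   placed in phase 1 (closest to the guard), any other array, or an
   aggregate containing an array, in phase 2, and remaining variables in
   phase 0 (illustrative summary of the classification below).  */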
1834 static int
1835 stack_protect_decl_phase (tree decl)
1837 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1838 int ret = 0;
1840 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1841 has_short_buffer = true;
1843 tree attribs = DECL_ATTRIBUTES (current_function_decl);
1844 if (!lookup_attribute ("no_stack_protector", attribs)
1845 && (flag_stack_protect == SPCT_FLAG_ALL
1846 || flag_stack_protect == SPCT_FLAG_STRONG
1847 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
1848 && lookup_attribute ("stack_protect", attribs))))
1850 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1851 && !(bits & SPCT_HAS_AGGREGATE))
1852 ret = 1;
1853 else if (bits & SPCT_HAS_ARRAY)
1854 ret = 2;
1856 else
1857 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1859 if (ret)
1860 has_protected_decls = true;
1862 return ret;
1865 /* Two helper routines that check for phase 1 and phase 2. These are used
1866 as callbacks for expand_stack_vars. */
1868 static bool
1869 stack_protect_decl_phase_1 (size_t i)
1871 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1874 static bool
1875 stack_protect_decl_phase_2 (size_t i)
1877 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
 1880 /* A helper function that checks for the asan phase (with stack protector
 1881 it is phase 3). This is used as a callback for expand_stack_vars.
1882 Returns true if any of the vars in the partition need to be protected. */
1884 static bool
1885 asan_decl_phase_3 (size_t i)
1887 while (i != EOC)
1889 if (asan_protect_stack_decl (stack_vars[i].decl))
1890 return true;
1891 i = stack_vars[i].next;
1893 return false;
1896 /* Ensure that variables in different stack protection phases conflict
1897 so that they are not merged and share the same stack slot.
1898 Return true if there are any address taken variables. */
1900 static bool
1901 add_stack_protection_conflicts (void)
1903 size_t i, j, n = stack_vars_num;
1904 unsigned char *phase;
1905 bool ret = false;
1907 phase = XNEWVEC (unsigned char, n);
1908 for (i = 0; i < n; ++i)
1910 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1911 if (TREE_ADDRESSABLE (stack_vars[i].decl))
1912 ret = true;
1915 for (i = 0; i < n; ++i)
1917 unsigned char ph_i = phase[i];
1918 for (j = i + 1; j < n; ++j)
1919 if (ph_i != phase[j])
1920 add_stack_var_conflict (i, j);
1923 XDELETEVEC (phase);
1924 return ret;
1927 /* Create a decl for the guard at the top of the stack frame. */
1929 static void
1930 create_stack_guard (void)
1932 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1933 VAR_DECL, NULL, ptr_type_node);
1934 TREE_THIS_VOLATILE (guard) = 1;
1935 TREE_USED (guard) = 1;
1936 expand_one_stack_var (guard);
1937 crtl->stack_protect_guard = guard;
1940 /* Prepare for expanding variables. */
1941 static void
1942 init_vars_expansion (void)
1944 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1945 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1947 /* A map from decl to stack partition. */
1948 decl_to_stack_part = new hash_map<tree, size_t>;
1950 /* Initialize local stack smashing state. */
1951 has_protected_decls = false;
1952 has_short_buffer = false;
1955 /* Free up stack variable graph data. */
1956 static void
1957 fini_vars_expansion (void)
1959 bitmap_obstack_release (&stack_var_bitmap_obstack);
1960 if (stack_vars)
1961 XDELETEVEC (stack_vars);
1962 if (stack_vars_sorted)
1963 XDELETEVEC (stack_vars_sorted);
1964 stack_vars = NULL;
1965 stack_vars_sorted = NULL;
1966 stack_vars_alloc = stack_vars_num = 0;
1967 delete decl_to_stack_part;
1968 decl_to_stack_part = NULL;
1971 /* Make a fair guess for the size of the stack frame of the function
1972 in NODE. This doesn't have to be exact, the result is only used in
1973 the inline heuristics. So we don't want to run the full stack var
1974 packing algorithm (which is quadratic in the number of stack vars).
1975 Instead, we calculate the total size of all stack vars. This turns
1976 out to be a pretty fair estimate -- packing of stack vars doesn't
1977 happen very often. */
1979 HOST_WIDE_INT
1980 estimated_stack_frame_size (struct cgraph_node *node)
1982 poly_int64 size = 0;
1983 size_t i;
1984 tree var;
1985 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1987 push_cfun (fn);
1989 init_vars_expansion ();
1991 FOR_EACH_LOCAL_DECL (fn, i, var)
1992 if (auto_var_in_fn_p (var, fn->decl))
1993 size += expand_one_var (var, true, false);
1995 if (stack_vars_num > 0)
1997 /* Fake sorting the stack vars for account_stack_vars (). */
1998 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1999 for (i = 0; i < stack_vars_num; ++i)
2000 stack_vars_sorted[i] = i;
2001 size += account_stack_vars ();
2004 fini_vars_expansion ();
2005 pop_cfun ();
2006 return estimated_poly_value (size);
2009 /* Check if the current function has calls that use a return slot. */
2011 static bool
2012 stack_protect_return_slot_p ()
2014 basic_block bb;
2016 FOR_ALL_BB_FN (bb, cfun)
2017 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
2018 !gsi_end_p (gsi); gsi_next (&gsi))
2020 gimple *stmt = gsi_stmt (gsi);
2021 /* This assumes that calls to internal-only functions never
2022 use a return slot. */
2023 if (is_gimple_call (stmt)
2024 && !gimple_call_internal_p (stmt)
2025 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
2026 gimple_call_fndecl (stmt)))
2027 return true;
2029 return false;
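/* Example of what the walk above is looking for (a sketch, not compiled
   here): a call whose aggregate return value is passed back in memory via a
   caller-allocated return slot, e.g.

       struct big { char buf[128]; };
       struct big make_big (void);
       void f (void) { struct big b = make_big (); }

   Under -fstack-protector-strong the presence of such a call is enough to
   request a stack guard even if F declares no local array itself.  */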
2032 /* Expand all variables used in the function. */
2034 static rtx_insn *
2035 expand_used_vars (void)
2037 tree var, outer_block = DECL_INITIAL (current_function_decl);
2038 auto_vec<tree> maybe_local_decls;
2039 rtx_insn *var_end_seq = NULL;
2040 unsigned i;
2041 unsigned len;
2042 bool gen_stack_protect_signal = false;
2044 /* Compute the phase of the stack frame for this function. */
2046 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2047 int off = targetm.starting_frame_offset () % align;
2048 frame_phase = off ? align - off : 0;
2051 /* Set TREE_USED on all variables in the local_decls. */
2052 FOR_EACH_LOCAL_DECL (cfun, i, var)
2053 TREE_USED (var) = 1;
2054 /* Clear TREE_USED on all variables associated with a block scope. */
2055 clear_tree_used (DECL_INITIAL (current_function_decl));
2057 init_vars_expansion ();
2059 if (targetm.use_pseudo_pic_reg ())
2060 pic_offset_table_rtx = gen_reg_rtx (Pmode);
2062 for (i = 0; i < SA.map->num_partitions; i++)
2064 if (bitmap_bit_p (SA.partitions_for_parm_default_defs, i))
2065 continue;
2067 tree var = partition_to_var (SA.map, i);
2069 gcc_assert (!virtual_operand_p (var));
2071 expand_one_ssa_partition (var);
2074 if (flag_stack_protect == SPCT_FLAG_STRONG)
2075 gen_stack_protect_signal = stack_protect_return_slot_p ();
2077 /* At this point all variables on the local_decls with TREE_USED
2078 set are not associated with any block scope. Lay them out. */
2080 len = vec_safe_length (cfun->local_decls);
2081 FOR_EACH_LOCAL_DECL (cfun, i, var)
2083 bool expand_now = false;
2085 /* Expanded above already. */
2086 if (is_gimple_reg (var))
2088 TREE_USED (var) = 0;
2089 goto next;
2091 /* We didn't set a block for static or extern because it's hard
2092 to tell the difference between a global variable (re)declared
2093 in a local scope, and one that's really declared there to
2094 begin with. And it doesn't really matter much, since we're
2095 not giving them stack space. Expand them now. */
2096 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
2097 expand_now = true;
2099 /* Expand variables not associated with any block now. Those created by
2100 the optimizers could be live anywhere in the function. Those that
2101 could possibly have been scoped originally and detached from their
2102 block will have their allocation deferred so we coalesce them with
2103 others when optimization is enabled. */
2104 else if (TREE_USED (var))
2105 expand_now = true;
2107 /* Finally, mark all variables on the list as used. We'll use
2108 this in a moment when we expand those associated with scopes. */
2109 TREE_USED (var) = 1;
2111 if (expand_now)
2112 expand_one_var (var, true, true);
2114 next:
2115 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
2117 rtx rtl = DECL_RTL_IF_SET (var);
2119 /* Keep artificial non-ignored vars in cfun->local_decls
2120 chain until instantiate_decls. */
2121 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2122 add_local_decl (cfun, var);
2123 else if (rtl == NULL_RTX)
2124 /* If rtl isn't set yet, which can happen e.g. with
2125 -fstack-protector, retry before returning from this
2126 function. */
2127 maybe_local_decls.safe_push (var);
2131 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
2133 +-----------------+-----------------+
2134 | ...processed... | ...duplicates...|
2135 +-----------------+-----------------+
2137 +-- LEN points here.
2139 We just want the duplicates, as those are the artificial
2140 non-ignored vars that we want to keep until instantiate_decls.
2141 Move them down and truncate the array. */
2142 if (!vec_safe_is_empty (cfun->local_decls))
2143 cfun->local_decls->block_remove (0, len);
2145 /* At this point, all variables within the block tree with TREE_USED
2146 set are actually used by the optimized function. Lay them out. */
2147 expand_used_vars_for_block (outer_block, true);
2149 tree attribs = DECL_ATTRIBUTES (current_function_decl);
2150 if (stack_vars_num > 0)
2152 bool has_addressable_vars = false;
2154 add_scope_conflicts ();
2156 /* If stack protection is enabled, we don't share space between
2157 vulnerable data and non-vulnerable data. */
2158 if (flag_stack_protect != 0
2159 && !lookup_attribute ("no_stack_protector", attribs)
2160 && (flag_stack_protect != SPCT_FLAG_EXPLICIT
2161 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2162 && lookup_attribute ("stack_protect", attribs))))
2163 has_addressable_vars = add_stack_protection_conflicts ();
2165 if (flag_stack_protect == SPCT_FLAG_STRONG && has_addressable_vars)
2166 gen_stack_protect_signal = true;
2168 /* Now that we have collected all stack variables, and have computed a
2169 minimal interference graph, attempt to save some stack space. */
2170 partition_stack_vars ();
2171 if (dump_file)
2172 dump_stack_var_partition ();
2176 if (!lookup_attribute ("no_stack_protector", attribs))
2177 switch (flag_stack_protect)
2179 case SPCT_FLAG_ALL:
2180 create_stack_guard ();
2181 break;
2183 case SPCT_FLAG_STRONG:
2184 if (gen_stack_protect_signal
2185 || cfun->calls_alloca
2186 || has_protected_decls
2187 || lookup_attribute ("stack_protect",
2188 DECL_ATTRIBUTES (current_function_decl)))
2189 create_stack_guard ();
2190 break;
2192 case SPCT_FLAG_DEFAULT:
2193 if (cfun->calls_alloca
2194 || has_protected_decls
2195 || lookup_attribute ("stack_protect",
2196 DECL_ATTRIBUTES (current_function_decl)))
2197 create_stack_guard ();
2198 break;
2200 case SPCT_FLAG_EXPLICIT:
2201 if (lookup_attribute ("stack_protect",
2202 DECL_ATTRIBUTES (current_function_decl)))
2203 create_stack_guard ();
2204 break;
2206 default:
2207 break;
2210 /* Assign rtl to each variable based on these partitions. */
2211 if (stack_vars_num > 0)
2213 class stack_vars_data data;
2215 data.asan_base = NULL_RTX;
2216 data.asan_alignb = 0;
2218 /* Reorder decls to be protected by iterating over the variables
2219 array multiple times, and allocating out of each phase in turn. */
2220 /* ??? We could probably integrate this into the qsort we did
2221 earlier, such that we naturally see these variables first,
2222 and thus naturally allocate things in the right order. */
2223 if (has_protected_decls)
2225 /* Phase 1 contains only character arrays. */
2226 expand_stack_vars (stack_protect_decl_phase_1, &data);
2228 /* Phase 2 contains other kinds of arrays. */
2229 if (!lookup_attribute ("no_stack_protector", attribs)
2230 && (flag_stack_protect == SPCT_FLAG_ALL
2231 || flag_stack_protect == SPCT_FLAG_STRONG
2232 || (flag_stack_protect == SPCT_FLAG_EXPLICIT
2233 && lookup_attribute ("stack_protect", attribs))))
2234 expand_stack_vars (stack_protect_decl_phase_2, &data);
2237 if (asan_sanitize_stack_p ())
2238 /* Phase 3, any partitions that need asan protection
2239 in addition to phase 1 and 2. */
2240 expand_stack_vars (asan_decl_phase_3, &data);
2242 /* ASAN description strings don't yet have a syntax for expressing
2243 polynomial offsets. */
2244 HOST_WIDE_INT prev_offset;
2245 if (!data.asan_vec.is_empty ()
2246 && frame_offset.is_constant (&prev_offset))
2248 HOST_WIDE_INT offset, sz, redzonesz;
2249 redzonesz = ASAN_RED_ZONE_SIZE;
2250 sz = data.asan_vec[0] - prev_offset;
2251 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
2252 && data.asan_alignb <= 4096
2253 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
2254 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
2255 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
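/* Worked instance of the rounding above, assuming ASAN_RED_ZONE_SIZE is 32
   (its value in asan.h at the time of writing): with sz == 40 and
   data.asan_alignb == 64,

       redzonesz = ((40 + 32 + 63) & ~63) - 40 = 128 - 40 = 88

   so sz + redzonesz == 128 is a multiple of the required alignment while
   still leaving at least ASAN_RED_ZONE_SIZE bytes of red zone.  */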
2256 /* Allocating a constant amount of space from a constant
2257 starting offset must give a constant result. */
2258 offset = (alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE)
2259 .to_constant ());
2260 data.asan_vec.safe_push (prev_offset);
2261 data.asan_vec.safe_push (offset);
2262 /* Leave space for alignment if STRICT_ALIGNMENT. */
2263 if (STRICT_ALIGNMENT)
2264 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
2265 << ASAN_SHADOW_SHIFT)
2266 / BITS_PER_UNIT, 1);
2268 var_end_seq
2269 = asan_emit_stack_protection (virtual_stack_vars_rtx,
2270 data.asan_base,
2271 data.asan_alignb,
2272 data.asan_vec.address (),
2273 data.asan_decl_vec.address (),
2274 data.asan_vec.length ());
2277 expand_stack_vars (NULL, &data);
2280 if (asan_sanitize_allocas_p () && cfun->calls_alloca)
2281 var_end_seq = asan_emit_allocas_unpoison (virtual_stack_dynamic_rtx,
2282 virtual_stack_vars_rtx,
2283 var_end_seq);
2285 fini_vars_expansion ();
2287 /* If there were any artificial non-ignored vars without rtl
2288 found earlier, see if deferred stack allocation hasn't assigned
2289 rtl to them. */
2290 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
2292 rtx rtl = DECL_RTL_IF_SET (var);
2294 /* Keep artificial non-ignored vars in cfun->local_decls
2295 chain until instantiate_decls. */
2296 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
2297 add_local_decl (cfun, var);
2300 /* If the target requires that FRAME_OFFSET be aligned, do it. */
2301 if (STACK_ALIGNMENT_NEEDED)
2303 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
2304 if (FRAME_GROWS_DOWNWARD)
2305 frame_offset = aligned_lower_bound (frame_offset, align);
2306 else
2307 frame_offset = aligned_upper_bound (frame_offset, align);
2310 return var_end_seq;
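/* Rough picture of what the above achieves with -fstack-protector-strong on
   a typical FRAME_GROWS_DOWNWARD target (illustrative only, not a layout
   guarantee):

       higher addresses
       | saved return address / registers |
       | stack guard                      |   <- create_stack_guard
       | phase 1: character arrays        |
       | phase 2: other arrays            |
       | remaining locals / asan redzones |
       lower addresses

   so a linear overrun of a protected buffer must clobber the guard before
   it can reach the saved return address.  */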
2314 /* If we need to produce a detailed dump, print the tree representation
2315 for STMT to the dump file. SINCE is the last RTX after which the RTL
2316 generated for STMT should have been appended. */
2318 static void
2319 maybe_dump_rtl_for_gimple_stmt (gimple *stmt, rtx_insn *since)
2321 if (dump_file && (dump_flags & TDF_DETAILS))
2323 fprintf (dump_file, "\n;; ");
2324 print_gimple_stmt (dump_file, stmt, 0,
2325 TDF_SLIM | (dump_flags & TDF_LINENO));
2326 fprintf (dump_file, "\n");
2328 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
2332 /* Maps the blocks that do not contain tree labels to rtx labels. */
2334 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
2336 /* Returns the label_rtx expression for a label starting basic block BB. */
2338 static rtx_code_label *
2339 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
2341 gimple_stmt_iterator gsi;
2342 tree lab;
2344 if (bb->flags & BB_RTL)
2345 return block_label (bb);
2347 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
2348 if (elt)
2349 return *elt;
2351 /* Find the tree label if it is present. */
2353 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
2355 glabel *lab_stmt;
2357 lab_stmt = dyn_cast <glabel *> (gsi_stmt (gsi));
2358 if (!lab_stmt)
2359 break;
2361 lab = gimple_label_label (lab_stmt);
2362 if (DECL_NONLOCAL (lab))
2363 break;
2365 return jump_target_rtx (lab);
2368 rtx_code_label *l = gen_label_rtx ();
2369 lab_rtx_for_bb->put (bb, l);
2370 return l;
2374 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2375 of a basic block where we just expanded the conditional at the end,
2376 possibly clean up the CFG and instruction sequence. LAST is the
2377 last instruction before the just emitted jump sequence. */
2379 static void
2380 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2382 /* Special case: when jumpif decides that the condition is
2383 trivial it emits an unconditional jump (and the necessary
2384 barrier). But we still have two edges, the fallthru one is
2385 wrong. purge_dead_edges would clean this up later. Unfortunately
2386 we have to insert insns (and split edges) before
2387 find_many_sub_basic_blocks and hence before purge_dead_edges.
2388 But splitting edges might create new blocks which depend on the
2389 fact that if there are two edges there's no barrier. So the
2390 barrier would get lost and verify_flow_info would ICE. Instead
2391 of auditing all edge splitters to care for the barrier (which
2392 normally isn't there in a cleaned CFG), fix it here. */
2393 if (BARRIER_P (get_last_insn ()))
2395 rtx_insn *insn;
2396 remove_edge (e);
 2397 /* Now we have a single successor block; if we have insns to
 2398 insert on the remaining edge, we will potentially insert
 2399 them at the end of this block (if the dest block isn't feasible)
 2400 in order to avoid splitting the edge. This insertion will take
2401 place in front of the last jump. But we might have emitted
2402 multiple jumps (conditional and one unconditional) to the
2403 same destination. Inserting in front of the last one then
2404 is a problem. See PR 40021. We fix this by deleting all
2405 jumps except the last unconditional one. */
2406 insn = PREV_INSN (get_last_insn ());
2407 /* Make sure we have an unconditional jump. Otherwise we're
2408 confused. */
2409 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2410 for (insn = PREV_INSN (insn); insn != last;)
2412 insn = PREV_INSN (insn);
2413 if (JUMP_P (NEXT_INSN (insn)))
2415 if (!any_condjump_p (NEXT_INSN (insn)))
2417 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2418 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2420 delete_insn (NEXT_INSN (insn));
2426 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2427 Returns a new basic block if we've terminated the current basic
2428 block and created a new one. */
2430 static basic_block
2431 expand_gimple_cond (basic_block bb, gcond *stmt)
2433 basic_block new_bb, dest;
2434 edge true_edge;
2435 edge false_edge;
2436 rtx_insn *last2, *last;
2437 enum tree_code code;
2438 tree op0, op1;
2440 code = gimple_cond_code (stmt);
2441 op0 = gimple_cond_lhs (stmt);
2442 op1 = gimple_cond_rhs (stmt);
2443 /* We're sometimes presented with such code:
2444 D.123_1 = x < y;
2445 if (D.123_1 != 0)
2447 This would expand to two comparisons which then later might
2448 be cleaned up by combine. But some pattern matchers like if-conversion
2449 work better when there's only one compare, so make up for this
 2450 here as a special exception if TER would have made the same change. */
2451 if (SA.values
2452 && TREE_CODE (op0) == SSA_NAME
2453 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2454 && TREE_CODE (op1) == INTEGER_CST
2455 && ((gimple_cond_code (stmt) == NE_EXPR
2456 && integer_zerop (op1))
2457 || (gimple_cond_code (stmt) == EQ_EXPR
2458 && integer_onep (op1)))
2459 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2461 gimple *second = SSA_NAME_DEF_STMT (op0);
2462 if (gimple_code (second) == GIMPLE_ASSIGN)
2464 enum tree_code code2 = gimple_assign_rhs_code (second);
2465 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2467 code = code2;
2468 op0 = gimple_assign_rhs1 (second);
2469 op1 = gimple_assign_rhs2 (second);
2471 /* If jumps are cheap and the target does not support conditional
2472 compare, turn some more codes into jumpy sequences. */
2473 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4
2474 && targetm.gen_ccmp_first == NULL)
2476 if ((code2 == BIT_AND_EXPR
2477 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2478 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2479 || code2 == TRUTH_AND_EXPR)
2481 code = TRUTH_ANDIF_EXPR;
2482 op0 = gimple_assign_rhs1 (second);
2483 op1 = gimple_assign_rhs2 (second);
2485 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2487 code = TRUTH_ORIF_EXPR;
2488 op0 = gimple_assign_rhs1 (second);
2489 op1 = gimple_assign_rhs2 (second);
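/* Illustrative sketch of the conversion above: when branches are cheap and
   the target has no conditional-compare pattern, gimple of the form

       _1 = a < b;
       _2 = c < d;
       _3 = _1 & _2;
       if (_3 != 0) goto <L>;

   may be expanded as if it had been written "if (a < b && c < d)", i.e. as
   a short-circuit sequence of two conditional jumps, instead of computing
   both comparison results and AND-ing them first.  */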
2495 /* Optimize (x % C1) == C2 or (x % C1) != C2 if it is beneficial
2496 into (x - C2) * C3 < C4. */
2497 if ((code == EQ_EXPR || code == NE_EXPR)
2498 && TREE_CODE (op0) == SSA_NAME
2499 && TREE_CODE (op1) == INTEGER_CST)
2500 code = maybe_optimize_mod_cmp (code, &op0, &op1);
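/* A concrete instance of the rewrite named above (illustrative; the actual
   constants are computed by maybe_optimize_mod_cmp): for a 32-bit unsigned
   x, the test

       x % 3 == 0

   can become

       x * 0xAAAAAAABu <= 0x55555555u

   since 0xAAAAAAAB is the multiplicative inverse of 3 modulo 2^32, which
   maps the multiples of 3 exactly onto the range 0 .. 0x55555555.  */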
2502 last2 = last = get_last_insn ();
2504 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2505 set_curr_insn_location (gimple_location (stmt));
2507 /* These flags have no purpose in RTL land. */
2508 true_edge->flags &= ~EDGE_TRUE_VALUE;
2509 false_edge->flags &= ~EDGE_FALSE_VALUE;
2511 /* We can either have a pure conditional jump with one fallthru edge or
2512 two-way jump that needs to be decomposed into two basic blocks. */
2513 if (false_edge->dest == bb->next_bb)
2515 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2516 true_edge->probability);
2517 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2518 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2519 set_curr_insn_location (true_edge->goto_locus);
2520 false_edge->flags |= EDGE_FALLTHRU;
2521 maybe_cleanup_end_of_block (false_edge, last);
2522 return NULL;
2524 if (true_edge->dest == bb->next_bb)
2526 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2527 false_edge->probability);
2528 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2529 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2530 set_curr_insn_location (false_edge->goto_locus);
2531 true_edge->flags |= EDGE_FALLTHRU;
2532 maybe_cleanup_end_of_block (true_edge, last);
2533 return NULL;
2536 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2537 true_edge->probability);
2538 last = get_last_insn ();
2539 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2540 set_curr_insn_location (false_edge->goto_locus);
2541 emit_jump (label_rtx_for_bb (false_edge->dest));
2543 BB_END (bb) = last;
2544 if (BARRIER_P (BB_END (bb)))
2545 BB_END (bb) = PREV_INSN (BB_END (bb));
2546 update_bb_for_insn (bb);
2548 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2549 dest = false_edge->dest;
2550 redirect_edge_succ (false_edge, new_bb);
2551 false_edge->flags |= EDGE_FALLTHRU;
2552 new_bb->count = false_edge->count ();
2553 loop_p loop = find_common_loop (bb->loop_father, dest->loop_father);
2554 add_bb_to_loop (new_bb, loop);
2555 if (loop->latch == bb
2556 && loop->header == dest)
2557 loop->latch = new_bb;
2558 make_single_succ_edge (new_bb, dest, 0);
2559 if (BARRIER_P (BB_END (new_bb)))
2560 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2561 update_bb_for_insn (new_bb);
2563 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2565 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2567 set_curr_insn_location (true_edge->goto_locus);
2568 true_edge->goto_locus = curr_insn_location ();
2571 return new_bb;
2574 /* Mark all calls that can have a transaction restart. */
2576 static void
2577 mark_transaction_restart_calls (gimple *stmt)
2579 struct tm_restart_node dummy;
2580 tm_restart_node **slot;
2582 if (!cfun->gimple_df->tm_restart)
2583 return;
2585 dummy.stmt = stmt;
2586 slot = cfun->gimple_df->tm_restart->find_slot (&dummy, NO_INSERT);
2587 if (slot)
2589 struct tm_restart_node *n = *slot;
2590 tree list = n->label_or_list;
2591 rtx_insn *insn;
2593 for (insn = next_real_insn (get_last_insn ());
2594 !CALL_P (insn);
2595 insn = next_real_insn (insn))
2596 continue;
2598 if (TREE_CODE (list) == LABEL_DECL)
2599 add_reg_note (insn, REG_TM, label_rtx (list));
2600 else
2601 for (; list ; list = TREE_CHAIN (list))
2602 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2606 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2607 statement STMT. */
2609 static void
2610 expand_call_stmt (gcall *stmt)
2612 tree exp, decl, lhs;
2613 bool builtin_p;
2614 size_t i;
2616 if (gimple_call_internal_p (stmt))
2618 expand_internal_call (stmt);
2619 return;
2622 /* If this is a call to a built-in function and it has no effect other
2623 than setting the lhs, try to implement it using an internal function
2624 instead. */
2625 decl = gimple_call_fndecl (stmt);
2626 if (gimple_call_lhs (stmt)
2627 && !gimple_has_side_effects (stmt)
2628 && (optimize || (decl && called_as_built_in (decl))))
2630 internal_fn ifn = replacement_internal_fn (stmt);
2631 if (ifn != IFN_LAST)
2633 expand_internal_call (ifn, stmt);
2634 return;
2638 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2640 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2641 builtin_p = decl && fndecl_built_in_p (decl);
2643 /* If this is not a builtin function, the function type through which the
2644 call is made may be different from the type of the function. */
2645 if (!builtin_p)
2646 CALL_EXPR_FN (exp)
2647 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2648 CALL_EXPR_FN (exp));
2650 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2651 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2653 for (i = 0; i < gimple_call_num_args (stmt); i++)
2655 tree arg = gimple_call_arg (stmt, i);
2656 gimple *def;
 2657 /* Let TER substitute addresses into the arguments of builtin functions
 2658 so we have a chance to infer more correct alignment information. See PR39954. */
2659 if (builtin_p
2660 && TREE_CODE (arg) == SSA_NAME
2661 && (def = get_gimple_for_ssa_name (arg))
2662 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2663 arg = gimple_assign_rhs1 (def);
2664 CALL_EXPR_ARG (exp, i) = arg;
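/* Hypothetical example of the substitution just above: for

       _1 = &s.data[i_4];
       __builtin_memcpy (_1, src_5, 32);

   the SSA name _1 is replaced by the ADDR_EXPR itself, so the memcpy
   expander can inspect &s.data[...] and derive the alignment of S rather
   than seeing only an opaque pointer (see PR39954).  */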
2667 if (gimple_has_side_effects (stmt))
2668 TREE_SIDE_EFFECTS (exp) = 1;
2670 if (gimple_call_nothrow_p (stmt))
2671 TREE_NOTHROW (exp) = 1;
2673 if (gimple_no_warning_p (stmt))
2674 TREE_NO_WARNING (exp) = 1;
2676 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2677 CALL_EXPR_MUST_TAIL_CALL (exp) = gimple_call_must_tail_p (stmt);
2678 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2679 if (decl
2680 && fndecl_built_in_p (decl, BUILT_IN_NORMAL)
2681 && ALLOCA_FUNCTION_CODE_P (DECL_FUNCTION_CODE (decl)))
2682 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2683 else
2684 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2685 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2686 CALL_EXPR_BY_DESCRIPTOR (exp) = gimple_call_by_descriptor_p (stmt);
2687 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2689 /* Ensure RTL is created for debug args. */
2690 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2692 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2693 unsigned int ix;
2694 tree dtemp;
2696 if (debug_args)
2697 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2699 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2700 expand_debug_expr (dtemp);
2704 rtx_insn *before_call = get_last_insn ();
2705 lhs = gimple_call_lhs (stmt);
2706 if (lhs)
2707 expand_assignment (lhs, exp, false);
2708 else
2709 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2711 /* If the gimple call is an indirect call and has 'nocf_check'
2712 attribute find a generated CALL insn to mark it as no
2713 control-flow verification is needed. */
2714 if (gimple_call_nocf_check_p (stmt)
2715 && !gimple_call_fndecl (stmt))
2717 rtx_insn *last = get_last_insn ();
2718 while (!CALL_P (last)
2719 && last != before_call)
2720 last = PREV_INSN (last);
2722 if (last != before_call)
2723 add_reg_note (last, REG_CALL_NOCF_CHECK, const0_rtx);
2726 mark_transaction_restart_calls (stmt);
2730 /* Generate RTL for an asm statement (explicit assembler code).
2731 STRING is a STRING_CST node containing the assembler code text,
2732 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2733 insn is volatile; don't optimize it. */
2735 static void
2736 expand_asm_loc (tree string, int vol, location_t locus)
2738 rtx body;
2740 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2741 ggc_strdup (TREE_STRING_POINTER (string)),
2742 locus);
2744 MEM_VOLATILE_P (body) = vol;
2746 /* Non-empty basic ASM implicitly clobbers memory. */
2747 if (TREE_STRING_LENGTH (string) != 0)
2749 rtx asm_op, clob;
2750 unsigned i, nclobbers;
2751 auto_vec<rtx> input_rvec, output_rvec;
2752 auto_vec<const char *> constraints;
2753 auto_vec<rtx> clobber_rvec;
2754 HARD_REG_SET clobbered_regs;
2755 CLEAR_HARD_REG_SET (clobbered_regs);
2757 clob = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
2758 clobber_rvec.safe_push (clob);
2760 if (targetm.md_asm_adjust)
2761 targetm.md_asm_adjust (output_rvec, input_rvec,
2762 constraints, clobber_rvec,
2763 clobbered_regs);
2765 asm_op = body;
2766 nclobbers = clobber_rvec.length ();
2767 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (1 + nclobbers));
2769 XVECEXP (body, 0, 0) = asm_op;
2770 for (i = 0; i < nclobbers; i++)
2771 XVECEXP (body, 0, i + 1) = gen_rtx_CLOBBER (VOIDmode, clobber_rvec[i]);
2774 emit_insn (body);
2777 /* Return the number of times character C occurs in string S. */
2778 static int
2779 n_occurrences (int c, const char *s)
2781 int n = 0;
2782 while (*s)
2783 n += (*s++ == c);
2784 return n;
2787 /* A subroutine of expand_asm_operands. Check that all operands have
2788 the same number of alternatives. Return true if so. */
2790 static bool
2791 check_operand_nalternatives (const vec<const char *> &constraints)
2793 unsigned len = constraints.length();
2794 if (len > 0)
2796 int nalternatives = n_occurrences (',', constraints[0]);
2798 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2800 error ("too many alternatives in %<asm%>");
2801 return false;
2804 for (unsigned i = 1; i < len; ++i)
2805 if (n_occurrences (',', constraints[i]) != nalternatives)
2807 error ("operand constraints for %<asm%> differ "
2808 "in number of alternatives");
2809 return false;
2812 return true;
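/* Example of the property being checked (illustrative): in

       asm ("..." : "=r,m" (out) : "r,r" (in));

   every constraint string has two comma-separated alternatives, which is
   accepted; writing "=r,m" for the output but a plain "r" for the input
   would trigger the "differ in number of alternatives" error above.  */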
2815 /* Check for overlap between registers marked in CLOBBERED_REGS and
 2816 anything inappropriate in T. Emit an error and return true if there
 2817 is a conflict, false otherwise. */
2819 static bool
2820 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2822 /* Conflicts between asm-declared register variables and the clobber
2823 list are not allowed. */
2824 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2826 if (overlap)
2828 error ("%<asm%> specifier for variable %qE conflicts with "
2829 "%<asm%> clobber list",
2830 DECL_NAME (overlap));
2832 /* Reset registerness to stop multiple errors emitted for a single
2833 variable. */
2834 DECL_REGISTER (overlap) = 0;
2835 return true;
2838 return false;
2841 /* Check that the given REGNO spanning NREGS is a valid
2842 asm clobber operand. Some HW registers cannot be
2843 saved/restored, hence they should not be clobbered by
2844 asm statements. */
2845 static bool
2846 asm_clobber_reg_is_valid (int regno, int nregs, const char *regname)
2848 bool is_valid = true;
2849 HARD_REG_SET regset;
2851 CLEAR_HARD_REG_SET (regset);
2853 add_range_to_hard_reg_set (&regset, regno, nregs);
2855 /* Clobbering the PIC register is an error. */
2856 if (PIC_OFFSET_TABLE_REGNUM != INVALID_REGNUM
2857 && overlaps_hard_reg_set_p (regset, Pmode, PIC_OFFSET_TABLE_REGNUM))
2859 /* ??? Diagnose during gimplification? */
2860 error ("PIC register clobbered by %qs in %<asm%>", regname);
2861 is_valid = false;
2863 else if (!in_hard_reg_set_p
2864 (accessible_reg_set, reg_raw_mode[regno], regno))
2866 /* ??? Diagnose during gimplification? */
2867 error ("the register %qs cannot be clobbered in %<asm%>"
2868 " for the current target", regname);
2869 is_valid = false;
2872 /* Clobbering the stack pointer register is deprecated. GCC expects
2873 the value of the stack pointer after an asm statement to be the same
2874 as it was before, so no asm can validly clobber the stack pointer in
2875 the usual sense. Adding the stack pointer to the clobber list has
2876 traditionally had some undocumented and somewhat obscure side-effects. */
2877 if (overlaps_hard_reg_set_p (regset, Pmode, STACK_POINTER_REGNUM))
2879 crtl->sp_is_clobbered_by_asm = true;
2880 if (warning (OPT_Wdeprecated, "listing the stack pointer register"
2881 " %qs in a clobber list is deprecated", regname))
2882 inform (input_location, "the value of the stack pointer after"
2883 " an %<asm%> statement must be the same as it was before"
2884 " the statement");
2887 return is_valid;
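/* Example that reaches the deprecation path above (illustrative; the
   register name is target-specific, e.g. "rsp" or "esp" on x86):

       asm volatile ("" ::: "sp");

   The statement is still accepted, but the fact is recorded in
   crtl->sp_is_clobbered_by_asm for the benefit of later passes.  */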
2890 /* Generate RTL for an asm statement with arguments.
2891 STRING is the instruction template.
2892 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2893 Each output or input has an expression in the TREE_VALUE and
2894 a tree list in TREE_PURPOSE which in turn contains a constraint
2895 name in TREE_VALUE (or NULL_TREE) and a constraint string
2896 in TREE_PURPOSE.
2897 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2898 that is clobbered by this insn.
2900 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2901 should be the fallthru basic block of the asm goto.
2903 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2904 Some elements of OUTPUTS may be replaced with trees representing temporary
2905 values. The caller should copy those temporary values to the originally
2906 specified lvalues.
2908 VOL nonzero means the insn is volatile; don't optimize it. */
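/* Illustrative mapping for a concrete extended asm (a sketch, not a formal
   specification):

       asm ("add %0, %1, %2" : "=r" (res) : "r" (a), "r" (b) : "cc");

   Here OUTPUTS holds one element whose TREE_VALUE is `res' with constraint
   string "=r", INPUTS holds two elements for `a' and `b' with constraint
   "r", CLOBBERS is the single STRING_CST "cc", and LABELS is empty (it is
   only populated for an asm goto).  */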
2910 static void
2911 expand_asm_stmt (gasm *stmt)
2913 class save_input_location
2915 location_t old;
2917 public:
2918 explicit save_input_location(location_t where)
2920 old = input_location;
2921 input_location = where;
2924 ~save_input_location()
2926 input_location = old;
2930 location_t locus = gimple_location (stmt);
2932 if (gimple_asm_input_p (stmt))
2934 const char *s = gimple_asm_string (stmt);
2935 tree string = build_string (strlen (s), s);
2936 expand_asm_loc (string, gimple_asm_volatile_p (stmt), locus);
2937 return;
 2940 /* There are some legacy diagnostics in here, and this also avoids a
 2941 sixth parameter to targetm.md_asm_adjust. */
2942 save_input_location s_i_l(locus);
2944 unsigned noutputs = gimple_asm_noutputs (stmt);
2945 unsigned ninputs = gimple_asm_ninputs (stmt);
2946 unsigned nlabels = gimple_asm_nlabels (stmt);
2947 unsigned i;
2949 /* ??? Diagnose during gimplification? */
2950 if (ninputs + noutputs + nlabels > MAX_RECOG_OPERANDS)
2952 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2953 return;
2956 auto_vec<tree, MAX_RECOG_OPERANDS> output_tvec;
2957 auto_vec<tree, MAX_RECOG_OPERANDS> input_tvec;
2958 auto_vec<const char *, MAX_RECOG_OPERANDS> constraints;
2960 /* Copy the gimple vectors into new vectors that we can manipulate. */
2962 output_tvec.safe_grow (noutputs, true);
2963 input_tvec.safe_grow (ninputs, true);
2964 constraints.safe_grow (noutputs + ninputs, true);
2966 for (i = 0; i < noutputs; ++i)
2968 tree t = gimple_asm_output_op (stmt, i);
2969 output_tvec[i] = TREE_VALUE (t);
2970 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2972 for (i = 0; i < ninputs; i++)
2974 tree t = gimple_asm_input_op (stmt, i);
2975 input_tvec[i] = TREE_VALUE (t);
2976 constraints[i + noutputs]
2977 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2980 /* ??? Diagnose during gimplification? */
2981 if (! check_operand_nalternatives (constraints))
2982 return;
2984 /* Count the number of meaningful clobbered registers, ignoring what
2985 we would ignore later. */
2986 auto_vec<rtx> clobber_rvec;
2987 HARD_REG_SET clobbered_regs;
2988 CLEAR_HARD_REG_SET (clobbered_regs);
2990 if (unsigned n = gimple_asm_nclobbers (stmt))
2992 clobber_rvec.reserve (n);
2993 for (i = 0; i < n; i++)
2995 tree t = gimple_asm_clobber_op (stmt, i);
2996 const char *regname = TREE_STRING_POINTER (TREE_VALUE (t));
2997 int nregs, j;
2999 j = decode_reg_name_and_count (regname, &nregs);
3000 if (j < 0)
3002 if (j == -2)
3004 /* ??? Diagnose during gimplification? */
3005 error ("unknown register name %qs in %<asm%>", regname);
3007 else if (j == -4)
3009 rtx x = gen_rtx_MEM (BLKmode, gen_rtx_SCRATCH (VOIDmode));
3010 clobber_rvec.safe_push (x);
3012 else
3014 /* Otherwise we should have -1 == empty string
3015 or -3 == cc, which is not a register. */
3016 gcc_assert (j == -1 || j == -3);
3019 else
3020 for (int reg = j; reg < j + nregs; reg++)
3022 if (!asm_clobber_reg_is_valid (reg, nregs, regname))
3023 return;
3025 SET_HARD_REG_BIT (clobbered_regs, reg);
3026 rtx x = gen_rtx_REG (reg_raw_mode[reg], reg);
3027 clobber_rvec.safe_push (x);
3032 /* First pass over inputs and outputs checks validity and sets
3033 mark_addressable if needed. */
3034 /* ??? Diagnose during gimplification? */
3036 for (i = 0; i < noutputs; ++i)
3038 tree val = output_tvec[i];
3039 tree type = TREE_TYPE (val);
3040 const char *constraint;
3041 bool is_inout;
3042 bool allows_reg;
3043 bool allows_mem;
3045 /* Try to parse the output constraint. If that fails, there's
3046 no point in going further. */
3047 constraint = constraints[i];
3048 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
3049 &allows_mem, &allows_reg, &is_inout))
3050 return;
3052 /* If the output is a hard register, verify it doesn't conflict with
3053 any other operand's possible hard register use. */
3054 if (DECL_P (val)
3055 && REG_P (DECL_RTL (val))
3056 && HARD_REGISTER_P (DECL_RTL (val)))
3058 unsigned j, output_hregno = REGNO (DECL_RTL (val));
3059 bool early_clobber_p = strchr (constraints[i], '&') != NULL;
3060 unsigned long match;
3062 /* Verify the other outputs do not use the same hard register. */
3063 for (j = i + 1; j < noutputs; ++j)
3064 if (DECL_P (output_tvec[j])
3065 && REG_P (DECL_RTL (output_tvec[j]))
3066 && HARD_REGISTER_P (DECL_RTL (output_tvec[j]))
3067 && output_hregno == REGNO (DECL_RTL (output_tvec[j])))
3068 error ("invalid hard register usage between output operands");
3070 /* Verify matching constraint operands use the same hard register
3071 and that the non-matching constraint operands do not use the same
3072 hard register if the output is an early clobber operand. */
3073 for (j = 0; j < ninputs; ++j)
3074 if (DECL_P (input_tvec[j])
3075 && REG_P (DECL_RTL (input_tvec[j]))
3076 && HARD_REGISTER_P (DECL_RTL (input_tvec[j])))
3078 unsigned input_hregno = REGNO (DECL_RTL (input_tvec[j]));
3079 switch (*constraints[j + noutputs])
3081 case '0': case '1': case '2': case '3': case '4':
3082 case '5': case '6': case '7': case '8': case '9':
3083 match = strtoul (constraints[j + noutputs], NULL, 10);
3084 break;
3085 default:
3086 match = ULONG_MAX;
3087 break;
3089 if (i == match
3090 && output_hregno != input_hregno)
3091 error ("invalid hard register usage between output operand "
3092 "and matching constraint operand");
3093 else if (early_clobber_p
3094 && i != match
3095 && output_hregno == input_hregno)
3096 error ("invalid hard register usage between earlyclobber "
3097 "operand and input operand");
3101 if (! allows_reg
3102 && (allows_mem
3103 || is_inout
3104 || (DECL_P (val)
3105 && REG_P (DECL_RTL (val))
3106 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
3107 mark_addressable (val);
3110 for (i = 0; i < ninputs; ++i)
3112 bool allows_reg, allows_mem;
3113 const char *constraint;
3115 constraint = constraints[i + noutputs];
3116 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3117 constraints.address (),
3118 &allows_mem, &allows_reg))
3119 return;
3121 if (! allows_reg && allows_mem)
3122 mark_addressable (input_tvec[i]);
3125 /* Second pass evaluates arguments. */
3127 /* Make sure stack is consistent for asm goto. */
3128 if (nlabels > 0)
3129 do_pending_stack_adjust ();
3130 int old_generating_concat_p = generating_concat_p;
3132 /* Vector of RTX's of evaluated output operands. */
3133 auto_vec<rtx, MAX_RECOG_OPERANDS> output_rvec;
3134 auto_vec<int, MAX_RECOG_OPERANDS> inout_opnum;
3135 rtx_insn *after_rtl_seq = NULL, *after_rtl_end = NULL;
3137 output_rvec.safe_grow (noutputs, true);
3139 for (i = 0; i < noutputs; ++i)
3141 tree val = output_tvec[i];
3142 tree type = TREE_TYPE (val);
3143 bool is_inout, allows_reg, allows_mem, ok;
3144 rtx op;
3146 ok = parse_output_constraint (&constraints[i], i, ninputs,
3147 noutputs, &allows_mem, &allows_reg,
3148 &is_inout);
3149 gcc_assert (ok);
3151 /* If an output operand is not a decl or indirect ref and our constraint
3152 allows a register, make a temporary to act as an intermediate.
3153 Make the asm insn write into that, then we will copy it to
3154 the real output operand. Likewise for promoted variables. */
3156 generating_concat_p = 0;
3158 if ((TREE_CODE (val) == INDIRECT_REF && allows_mem)
3159 || (DECL_P (val)
3160 && (allows_mem || REG_P (DECL_RTL (val)))
3161 && ! (REG_P (DECL_RTL (val))
3162 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
3163 || ! allows_reg
3164 || is_inout
3165 || TREE_ADDRESSABLE (type))
3167 op = expand_expr (val, NULL_RTX, VOIDmode,
3168 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
3169 if (MEM_P (op))
3170 op = validize_mem (op);
3172 if (! allows_reg && !MEM_P (op))
3173 error ("output number %d not directly addressable", i);
3174 if ((! allows_mem && MEM_P (op) && GET_MODE (op) != BLKmode)
3175 || GET_CODE (op) == CONCAT)
3177 rtx old_op = op;
3178 op = gen_reg_rtx (GET_MODE (op));
3180 generating_concat_p = old_generating_concat_p;
3182 if (is_inout)
3183 emit_move_insn (op, old_op);
3185 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3186 emit_move_insn (old_op, op);
3187 after_rtl_seq = get_insns ();
3188 after_rtl_end = get_last_insn ();
3189 end_sequence ();
3192 else
3194 op = assign_temp (type, 0, 1);
3195 op = validize_mem (op);
3196 if (!MEM_P (op) && TREE_CODE (val) == SSA_NAME)
3197 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (val), op);
3199 generating_concat_p = old_generating_concat_p;
3201 push_to_sequence2 (after_rtl_seq, after_rtl_end);
3202 expand_assignment (val, make_tree (type, op), false);
3203 after_rtl_seq = get_insns ();
3204 after_rtl_end = get_last_insn ();
3205 end_sequence ();
3207 output_rvec[i] = op;
3209 if (is_inout)
3210 inout_opnum.safe_push (i);
3213 auto_vec<rtx, MAX_RECOG_OPERANDS> input_rvec;
3214 auto_vec<machine_mode, MAX_RECOG_OPERANDS> input_mode;
3216 input_rvec.safe_grow (ninputs, true);
3217 input_mode.safe_grow (ninputs, true);
3219 generating_concat_p = 0;
3221 for (i = 0; i < ninputs; ++i)
3223 tree val = input_tvec[i];
3224 tree type = TREE_TYPE (val);
3225 bool allows_reg, allows_mem, ok;
3226 const char *constraint;
3227 rtx op;
3229 constraint = constraints[i + noutputs];
3230 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, 0,
3231 constraints.address (),
3232 &allows_mem, &allows_reg);
3233 gcc_assert (ok);
3235 /* EXPAND_INITIALIZER will not generate code for valid initializer
3236 constants, but will still generate code for other types of operand.
3237 This is the behavior we want for constant constraints. */
3238 op = expand_expr (val, NULL_RTX, VOIDmode,
3239 allows_reg ? EXPAND_NORMAL
3240 : allows_mem ? EXPAND_MEMORY
3241 : EXPAND_INITIALIZER);
3243 /* Never pass a CONCAT to an ASM. */
3244 if (GET_CODE (op) == CONCAT)
3245 op = force_reg (GET_MODE (op), op);
3246 else if (MEM_P (op))
3247 op = validize_mem (op);
3249 if (asm_operand_ok (op, constraint, NULL) <= 0)
3251 if (allows_reg && TYPE_MODE (type) != BLKmode)
3252 op = force_reg (TYPE_MODE (type), op);
3253 else if (!allows_mem)
3254 warning (0, "%<asm%> operand %d probably does not match "
3255 "constraints",
3256 i + noutputs);
3257 else if (MEM_P (op))
 3259 /* We won't recognize either volatile memory or memory
 3260 with a queued address as an available memory_operand
 3261 at this point. Ignore it: clearly this *is* a memory. */
3263 else
3264 gcc_unreachable ();
3266 input_rvec[i] = op;
3267 input_mode[i] = TYPE_MODE (type);
3270 /* For in-out operands, copy output rtx to input rtx. */
3271 unsigned ninout = inout_opnum.length();
3272 for (i = 0; i < ninout; i++)
3274 int j = inout_opnum[i];
3275 rtx o = output_rvec[j];
3277 input_rvec.safe_push (o);
3278 input_mode.safe_push (GET_MODE (o));
3280 char buffer[16];
3281 sprintf (buffer, "%d", j);
3282 constraints.safe_push (ggc_strdup (buffer));
3284 ninputs += ninout;
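/* Illustrative note on the loop above (a sketch): when output operand J was
   parsed as an in-out operand, its rtx is appended once more as an input
   whose constraint is simply the decimal string "J", i.e. it ends up as an
   ordinary matching-constraint pair such as

       asm ("incl %0" : "=r" (x) : "0" (x));
*/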
 3286 /* Sometimes we wish to automatically clobber registers across an asm.
 3287 A case in point is the i386 backend's move from cc0 to a hard reg --
 3288 maintaining source-level compatibility means automatically clobbering
 3289 the flags register. */
3290 rtx_insn *after_md_seq = NULL;
3291 if (targetm.md_asm_adjust)
3292 after_md_seq = targetm.md_asm_adjust (output_rvec, input_rvec,
3293 constraints, clobber_rvec,
3294 clobbered_regs);
3296 /* Do not allow the hook to change the output and input count,
3297 lest it mess up the operand numbering. */
3298 gcc_assert (output_rvec.length() == noutputs);
3299 gcc_assert (input_rvec.length() == ninputs);
3300 gcc_assert (constraints.length() == noutputs + ninputs);
3302 /* But it certainly can adjust the clobbers. */
3303 unsigned nclobbers = clobber_rvec.length ();
3305 /* Third pass checks for easy conflicts. */
3306 /* ??? Why are we doing this on trees instead of rtx. */
3308 bool clobber_conflict_found = 0;
3309 for (i = 0; i < noutputs; ++i)
3310 if (tree_conflicts_with_clobbers_p (output_tvec[i], &clobbered_regs))
3311 clobber_conflict_found = 1;
3312 for (i = 0; i < ninputs - ninout; ++i)
3313 if (tree_conflicts_with_clobbers_p (input_tvec[i], &clobbered_regs))
3314 clobber_conflict_found = 1;
3316 /* Make vectors for the expression-rtx, constraint strings,
3317 and named operands. */
3319 rtvec argvec = rtvec_alloc (ninputs);
3320 rtvec constraintvec = rtvec_alloc (ninputs);
3321 rtvec labelvec = rtvec_alloc (nlabels);
3323 rtx body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
3324 : GET_MODE (output_rvec[0])),
3325 ggc_strdup (gimple_asm_string (stmt)),
3326 "", 0, argvec, constraintvec,
3327 labelvec, locus);
3328 MEM_VOLATILE_P (body) = gimple_asm_volatile_p (stmt);
3330 for (i = 0; i < ninputs; ++i)
3332 ASM_OPERANDS_INPUT (body, i) = input_rvec[i];
3333 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
3334 = gen_rtx_ASM_INPUT_loc (input_mode[i],
3335 constraints[i + noutputs],
3336 locus);
3339 /* Copy labels to the vector. */
3340 rtx_code_label *fallthru_label = NULL;
3341 if (nlabels > 0)
3343 basic_block fallthru_bb = NULL;
3344 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
3345 if (fallthru)
3346 fallthru_bb = fallthru->dest;
3348 for (i = 0; i < nlabels; ++i)
3350 tree label = TREE_VALUE (gimple_asm_label_op (stmt, i));
3351 rtx_insn *r;
3352 /* If asm goto has any labels in the fallthru basic block, use
3353 a label that we emit immediately after the asm goto. Expansion
3354 may insert further instructions into the same basic block after
3355 asm goto and if we don't do this, insertion of instructions on
3356 the fallthru edge might misbehave. See PR58670. */
3357 if (fallthru_bb && label_to_block (cfun, label) == fallthru_bb)
3359 if (fallthru_label == NULL_RTX)
3360 fallthru_label = gen_label_rtx ();
3361 r = fallthru_label;
3363 else
3364 r = label_rtx (label);
3365 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
3369 /* Now, for each output, construct an rtx
3370 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
3371 ARGVEC CONSTRAINTS OPNAMES))
3372 If there is more than one, put them inside a PARALLEL. */
3374 if (noutputs == 0 && nclobbers == 0)
3376 /* No output operands: put in a raw ASM_OPERANDS rtx. */
3377 if (nlabels > 0)
3378 emit_jump_insn (body);
3379 else
3380 emit_insn (body);
3382 else if (noutputs == 1 && nclobbers == 0)
3384 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = constraints[0];
3385 if (nlabels > 0)
3386 emit_jump_insn (gen_rtx_SET (output_rvec[0], body));
3387 else
3388 emit_insn (gen_rtx_SET (output_rvec[0], body));
3390 else
3392 rtx obody = body;
3393 int num = noutputs;
3395 if (num == 0)
3396 num = 1;
3398 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
3400 /* For each output operand, store a SET. */
3401 for (i = 0; i < noutputs; ++i)
3403 rtx src, o = output_rvec[i];
3404 if (i == 0)
3406 ASM_OPERANDS_OUTPUT_CONSTRAINT (obody) = constraints[0];
3407 src = obody;
3409 else
3411 src = gen_rtx_ASM_OPERANDS (GET_MODE (o),
3412 ASM_OPERANDS_TEMPLATE (obody),
3413 constraints[i], i, argvec,
3414 constraintvec, labelvec, locus);
3415 MEM_VOLATILE_P (src) = gimple_asm_volatile_p (stmt);
3417 XVECEXP (body, 0, i) = gen_rtx_SET (o, src);
3420 /* If there are no outputs (but there are some clobbers)
3421 store the bare ASM_OPERANDS into the PARALLEL. */
3422 if (i == 0)
3423 XVECEXP (body, 0, i++) = obody;
3425 /* Store (clobber REG) for each clobbered register specified. */
3426 for (unsigned j = 0; j < nclobbers; ++j)
3428 rtx clobbered_reg = clobber_rvec[j];
 3430 /* Do a sanity check for any overlap between the clobbers and the
 3431 input and output operands that has not been handled. Such overlap
 3432 should have been detected and reported above. */
3433 if (!clobber_conflict_found && REG_P (clobbered_reg))
3435 /* We test the old body (obody) contents to avoid
3436 tripping over the under-construction body. */
3437 for (unsigned k = 0; k < noutputs; ++k)
3438 if (reg_overlap_mentioned_p (clobbered_reg, output_rvec[k]))
3439 internal_error ("%<asm%> clobber conflict with "
3440 "output operand");
3442 for (unsigned k = 0; k < ninputs - ninout; ++k)
3443 if (reg_overlap_mentioned_p (clobbered_reg, input_rvec[k]))
3444 internal_error ("%<asm%> clobber conflict with "
3445 "input operand");
3448 XVECEXP (body, 0, i++) = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
3451 if (nlabels > 0)
3452 emit_jump_insn (body);
3453 else
3454 emit_insn (body);
3457 generating_concat_p = old_generating_concat_p;
3459 if (fallthru_label)
3460 emit_label (fallthru_label);
3462 if (after_md_seq)
3463 emit_insn (after_md_seq);
3464 if (after_rtl_seq)
3466 if (nlabels == 0)
3467 emit_insn (after_rtl_seq);
3468 else
3470 edge e;
3471 edge_iterator ei;
3473 FOR_EACH_EDGE (e, ei, gimple_bb (stmt)->succs)
3475 start_sequence ();
3476 for (rtx_insn *curr = after_rtl_seq;
3477 curr != NULL_RTX;
3478 curr = NEXT_INSN (curr))
3479 emit_insn (copy_insn (PATTERN (curr)));
3480 rtx_insn *copy = get_insns ();
3481 end_sequence ();
3482 insert_insn_on_edge (copy, e);
3487 free_temp_slots ();
3488 crtl->has_asm_statement = 1;
3491 /* Emit code to jump to the address
3492 specified by the pointer expression EXP. */
3494 static void
3495 expand_computed_goto (tree exp)
3497 rtx x = expand_normal (exp);
3499 do_pending_stack_adjust ();
3500 emit_indirect_jump (x);
3503 /* Generate RTL code for a `goto' statement with target label LABEL.
3504 LABEL should be a LABEL_DECL tree node that was or will later be
3505 defined with `expand_label'. */
3507 static void
3508 expand_goto (tree label)
3510 if (flag_checking)
3512 /* Check for a nonlocal goto to a containing function. Should have
3513 gotten translated to __builtin_nonlocal_goto. */
3514 tree context = decl_function_context (label);
3515 gcc_assert (!context || context == current_function_decl);
3518 emit_jump (jump_target_rtx (label));
3521 /* Output a return with no value. */
3523 static void
3524 expand_null_return_1 (void)
3526 clear_pending_stack_adjust ();
3527 do_pending_stack_adjust ();
3528 emit_jump (return_label);
3531 /* Generate RTL to return from the current function, with no value.
3532 (That is, we do not do anything about returning any value.) */
3534 void
3535 expand_null_return (void)
3537 /* If this function was declared to return a value, but we
3538 didn't, clobber the return registers so that they are not
3539 propagated live to the rest of the function. */
3540 clobber_return_register ();
3542 expand_null_return_1 ();
3545 /* Generate RTL to return from the current function, with value VAL. */
3547 static void
3548 expand_value_return (rtx val)
3550 /* Copy the value to the return location unless it's already there. */
3552 tree decl = DECL_RESULT (current_function_decl);
3553 rtx return_reg = DECL_RTL (decl);
3554 if (return_reg != val)
3556 tree funtype = TREE_TYPE (current_function_decl);
3557 tree type = TREE_TYPE (decl);
3558 int unsignedp = TYPE_UNSIGNED (type);
3559 machine_mode old_mode = DECL_MODE (decl);
3560 machine_mode mode;
3561 if (DECL_BY_REFERENCE (decl))
3562 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3563 else
3564 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3566 if (mode != old_mode)
3567 val = convert_modes (mode, old_mode, val, unsignedp);
3569 if (GET_CODE (return_reg) == PARALLEL)
3570 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3571 else
3572 emit_move_insn (return_reg, val);
3575 expand_null_return_1 ();
3578 /* Generate RTL to evaluate the expression RETVAL and return it
3579 from the current function. */
3581 static void
3582 expand_return (tree retval)
3584 rtx result_rtl;
3585 rtx val = 0;
3586 tree retval_rhs;
3588 /* If function wants no value, give it none. */
3589 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3591 expand_normal (retval);
3592 expand_null_return ();
3593 return;
3596 if (retval == error_mark_node)
3598 /* Treat this like a return of no value from a function that
3599 returns a value. */
3600 expand_null_return ();
3601 return;
3603 else if ((TREE_CODE (retval) == MODIFY_EXPR
3604 || TREE_CODE (retval) == INIT_EXPR)
3605 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3606 retval_rhs = TREE_OPERAND (retval, 1);
3607 else
3608 retval_rhs = retval;
3610 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3612 /* If we are returning the RESULT_DECL, then the value has already
3613 been stored into it, so we don't have to do anything special. */
3614 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3615 expand_value_return (result_rtl);
3617 /* If the result is an aggregate that is being returned in one (or more)
3618 registers, load the registers here. */
3620 else if (retval_rhs != 0
3621 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3622 && REG_P (result_rtl))
3624 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3625 if (val)
3627 /* Use the mode of the result value on the return register. */
3628 PUT_MODE (result_rtl, GET_MODE (val));
3629 expand_value_return (val);
3631 else
3632 expand_null_return ();
3634 else if (retval_rhs != 0
3635 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3636 && (REG_P (result_rtl)
3637 || (GET_CODE (result_rtl) == PARALLEL)))
3639 /* Compute the return value into a temporary (usually a pseudo reg). */
 3640 val
 3641 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3642 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3643 val = force_not_mem (val);
3644 expand_value_return (val);
3646 else
3648 /* No hard reg used; calculate value into hard return reg. */
3649 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3650 expand_value_return (result_rtl);
 3654 /* Expand a clobber of LHS. If LHS is stored in a multi-part
3655 register, tell the rtl optimizers that its value is no longer
3656 needed. */
3658 static void
3659 expand_clobber (tree lhs)
3661 if (DECL_P (lhs))
3663 rtx decl_rtl = DECL_RTL_IF_SET (lhs);
3664 if (decl_rtl && REG_P (decl_rtl))
3666 machine_mode decl_mode = GET_MODE (decl_rtl);
3667 if (maybe_gt (GET_MODE_SIZE (decl_mode),
3668 REGMODE_NATURAL_SIZE (decl_mode)))
3669 emit_clobber (decl_rtl);
3674 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3675 STMT that doesn't require special handling for outgoing edges. That
3676 is no tailcalls and no GIMPLE_COND. */
3678 static void
3679 expand_gimple_stmt_1 (gimple *stmt)
3681 tree op0;
3683 set_curr_insn_location (gimple_location (stmt));
3685 switch (gimple_code (stmt))
3687 case GIMPLE_GOTO:
3688 op0 = gimple_goto_dest (stmt);
3689 if (TREE_CODE (op0) == LABEL_DECL)
3690 expand_goto (op0);
3691 else
3692 expand_computed_goto (op0);
3693 break;
3694 case GIMPLE_LABEL:
3695 expand_label (gimple_label_label (as_a <glabel *> (stmt)));
3696 break;
3697 case GIMPLE_NOP:
3698 case GIMPLE_PREDICT:
3699 break;
3700 case GIMPLE_SWITCH:
3702 gswitch *swtch = as_a <gswitch *> (stmt);
3703 if (gimple_switch_num_labels (swtch) == 1)
3704 expand_goto (CASE_LABEL (gimple_switch_default_label (swtch)));
3705 else
3706 expand_case (swtch);
3708 break;
3709 case GIMPLE_ASM:
3710 expand_asm_stmt (as_a <gasm *> (stmt));
3711 break;
3712 case GIMPLE_CALL:
3713 expand_call_stmt (as_a <gcall *> (stmt));
3714 break;
3716 case GIMPLE_RETURN:
3718 op0 = gimple_return_retval (as_a <greturn *> (stmt));
3720 /* If a return doesn't have a location, it very likely represents
3721 multiple user returns so we cannot let it inherit the location
3722 of the last statement of the previous basic block in RTL. */
3723 if (!gimple_has_location (stmt))
3724 set_curr_insn_location (cfun->function_end_locus);
3726 if (op0 && op0 != error_mark_node)
3728 tree result = DECL_RESULT (current_function_decl);
3730 /* If we are not returning the current function's RESULT_DECL,
3731 build an assignment to it. */
3732 if (op0 != result)
3734 /* I believe that a function's RESULT_DECL is unique. */
3735 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3737 /* ??? We'd like to use simply expand_assignment here,
3738 but this fails if the value is of BLKmode but the return
3739 decl is a register. expand_return has special handling
3740 for this combination, which eventually should move
3741 to common code. See comments there. Until then, let's
3742 build a modify expression :-/ */
3743 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3744 result, op0);
3748 if (!op0)
3749 expand_null_return ();
3750 else
3751 expand_return (op0);
3753 break;
3755 case GIMPLE_ASSIGN:
3757 gassign *assign_stmt = as_a <gassign *> (stmt);
3758 tree lhs = gimple_assign_lhs (assign_stmt);
3760 /* Tree expand used to fiddle with |= and &= of two bitfield
3761 COMPONENT_REFs here. This can't happen with gimple, the LHS
3762 of binary assigns must be a gimple reg. */
3764 if (TREE_CODE (lhs) != SSA_NAME
3765 || gimple_assign_rhs_class (assign_stmt) == GIMPLE_SINGLE_RHS)
3767 tree rhs = gimple_assign_rhs1 (assign_stmt);
3768 gcc_assert (gimple_assign_rhs_class (assign_stmt)
3769 == GIMPLE_SINGLE_RHS);
3770 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs)
3771 /* Do not put locations on possibly shared trees. */
3772 && !is_gimple_min_invariant (rhs))
3773 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3774 if (TREE_CLOBBER_P (rhs))
3775 /* This is a clobber to mark the going out of scope for
3776 this LHS. */
3777 expand_clobber (lhs);
3778 else
3779 expand_assignment (lhs, rhs,
3780 gimple_assign_nontemporal_move_p (
3781 assign_stmt));
3783 else
3785 rtx target, temp;
3786 bool nontemporal = gimple_assign_nontemporal_move_p (assign_stmt);
3787 struct separate_ops ops;
3788 bool promoted = false;
3790 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3791 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3792 promoted = true;
3794 ops.code = gimple_assign_rhs_code (assign_stmt);
3795 ops.type = TREE_TYPE (lhs);
3796 switch (get_gimple_rhs_class (ops.code))
3798 case GIMPLE_TERNARY_RHS:
3799 ops.op2 = gimple_assign_rhs3 (assign_stmt);
3800 /* Fallthru */
3801 case GIMPLE_BINARY_RHS:
3802 ops.op1 = gimple_assign_rhs2 (assign_stmt);
3803 /* Fallthru */
3804 case GIMPLE_UNARY_RHS:
3805 ops.op0 = gimple_assign_rhs1 (assign_stmt);
3806 break;
3807 default:
3808 gcc_unreachable ();
3810 ops.location = gimple_location (stmt);
3812 /* If we want to use a nontemporal store, force the value to
3813 register first. If we store into a promoted register,
3814 don't directly expand to target. */
3815 temp = nontemporal || promoted ? NULL_RTX : target;
3816 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3817 EXPAND_NORMAL);
3819 if (temp == target)
3821 else if (promoted)
3823 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3824 /* If TEMP is a VOIDmode constant, use convert_modes to make
3825 sure that we properly convert it. */
3826 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3828 temp = convert_modes (GET_MODE (target),
3829 TYPE_MODE (ops.type),
3830 temp, unsignedp);
3831 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3832 GET_MODE (target), temp, unsignedp);
3835 convert_move (SUBREG_REG (target), temp, unsignedp);
3837 else if (nontemporal && emit_storent_insn (target, temp))
3839 else
3841 temp = force_operand (temp, target);
3842 if (temp != target)
3843 emit_move_insn (target, temp);
3847 break;
3849 default:
3850 gcc_unreachable ();
3854 /* Expand one gimple statement STMT and return the last RTL instruction
3855 before any of the newly generated ones.
3857 In addition to generating the necessary RTL instructions this also
3858 sets REG_EH_REGION notes if necessary and sets the current source
3859 location for diagnostics. */
3861 static rtx_insn *
3862 expand_gimple_stmt (gimple *stmt)
3864 location_t saved_location = input_location;
3865 rtx_insn *last = get_last_insn ();
3866 int lp_nr;
3868 gcc_assert (cfun);
3870 /* We need to save and restore the current source location so that errors
3871 discovered during expansion are emitted with the right location. But
3872 it would be better if the diagnostic routines used the source location
3873 embedded in the tree nodes rather than globals. */
3874 if (gimple_has_location (stmt))
3875 input_location = gimple_location (stmt);
3877 expand_gimple_stmt_1 (stmt);
3879 /* Free any temporaries used to evaluate this statement. */
3880 free_temp_slots ();
3882 input_location = saved_location;
3884 /* Mark all insns that may trap. */
3885 lp_nr = lookup_stmt_eh_lp (stmt);
3886 if (lp_nr)
3888 rtx_insn *insn;
3889 for (insn = next_real_insn (last); insn;
3890 insn = next_real_insn (insn))
3892 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3893 /* If we want exceptions for non-call insns, any
3894 may_trap_p instruction may throw. */
3895 && GET_CODE (PATTERN (insn)) != CLOBBER
3896 && GET_CODE (PATTERN (insn)) != USE
3897 && insn_could_throw_p (insn))
3898 make_reg_eh_region_note (insn, 0, lp_nr);
3902 return last;
3905 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3906 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3907 generated a tail call (something that might be denied by the ABI
3908 rules governing the call; see calls.c).
3910 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3911 can still reach the rest of BB. The case here is __builtin_sqrt,
3912 where the NaN result goes through the external function (with a
3913 tailcall) and the normal result happens via a sqrt instruction. */
3915 static basic_block
3916 expand_gimple_tailcall (basic_block bb, gcall *stmt, bool *can_fallthru)
3918 rtx_insn *last2, *last;
3919 edge e;
3920 edge_iterator ei;
3921 profile_probability probability;
3923 last2 = last = expand_gimple_stmt (stmt);
3925 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3926 if (CALL_P (last) && SIBLING_CALL_P (last))
3927 goto found;
3929 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3931 *can_fallthru = true;
3932 return NULL;
3934 found:
3935 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3936 Any instructions emitted here are about to be deleted. */
3937 do_pending_stack_adjust ();
3939 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3940 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3941 EH or abnormal edges, we shouldn't have created a tail call in
3942 the first place. So it seems to me we should just be removing
3943 all edges here, or redirecting the existing fallthru edge to
3944 the exit block. */
3946 probability = profile_probability::never ();
3948 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3950 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3952 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3953 e->dest->count -= e->count ();
3954 probability += e->probability;
3955 remove_edge (e);
3957 else
3958 ei_next (&ei);
3961 /* This is somewhat ugly: the call_expr expander often emits instructions
3962 after the sibcall (to perform the function return). These confuse the
3963 find_many_sub_basic_blocks code, so we need to get rid of them. */
3964 last = NEXT_INSN (last);
3965 gcc_assert (BARRIER_P (last));
3967 *can_fallthru = false;
3968 while (NEXT_INSN (last))
3970 /* For instance, an sqrt builtin expander expands an if with a
3971 sibcall in the then-arm and a label for the else-arm. */
3972 if (LABEL_P (NEXT_INSN (last)))
3974 *can_fallthru = true;
3975 break;
3977 delete_insn (NEXT_INSN (last));
3980 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3981 | EDGE_SIBCALL);
3982 e->probability = probability;
3983 BB_END (bb) = last;
3984 update_bb_for_insn (bb);
3986 if (NEXT_INSN (last))
3988 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3990 last = BB_END (bb);
3991 if (BARRIER_P (last))
3992 BB_END (bb) = PREV_INSN (last);
3995 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3997 return bb;
4000 /* Return the difference between the floor and the truncated result of
4001 a signed division by OP1 with remainder MOD. */
4002 static rtx
4003 floor_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4005 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
4006 return gen_rtx_IF_THEN_ELSE
4007 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4008 gen_rtx_IF_THEN_ELSE
4009 (mode, gen_rtx_LT (BImode,
4010 gen_rtx_DIV (mode, op1, mod),
4011 const0_rtx),
4012 constm1_rtx, const0_rtx),
4013 const0_rtx);
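/* A worked example of the formula above: for signed -7 / 2 the truncated
   quotient is -3 and MOD is -1.  MOD != 0 and OP1 / MOD = 2 / -1 < 0, so
   the adjustment is -1, giving the floor result -3 + -1 = -4.  */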
4016 /* Return the difference between the ceil and the truncated result of
4017 a signed division by OP1 with remainder MOD. */
4018 static rtx
4019 ceil_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4021 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
4022 return gen_rtx_IF_THEN_ELSE
4023 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4024 gen_rtx_IF_THEN_ELSE
4025 (mode, gen_rtx_GT (BImode,
4026 gen_rtx_DIV (mode, op1, mod),
4027 const0_rtx),
4028 const1_rtx, const0_rtx),
4029 const0_rtx);
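/* A worked example: for signed 7 / 2 the truncated quotient is 3 and MOD
   is 1.  MOD != 0 and OP1 / MOD = 2 / 1 > 0, so the adjustment is 1,
   giving the ceiling result 3 + 1 = 4.  */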
4032 /* Return the difference between the ceil and the truncated result of
4033 an unsigned division by OP1 with remainder MOD. */
4034 static rtx
4035 ceil_udiv_adjust (machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
4037 /* (mod != 0 ? 1 : 0) */
4038 return gen_rtx_IF_THEN_ELSE
4039 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
4040 const1_rtx, const0_rtx);
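/* A worked example: for unsigned 7 / 2 the truncated quotient is 3 and
   MOD is 1; MOD != 0, so the adjustment is 1 and the ceiling result is 4.  */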
4043 /* Return the difference between the rounded and the truncated result
4044 of a signed division by OP1 with remainder MOD. Halfway cases are
4045 rounded away from zero, rather than to the nearest even number. */
4046 static rtx
4047 round_sdiv_adjust (machine_mode mode, rtx mod, rtx op1)
4049 /* (abs (mod) >= abs (op1) - abs (mod)
4050 ? (op1 / mod > 0 ? 1 : -1)
4051 : 0) */
4052 return gen_rtx_IF_THEN_ELSE
4053 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
4054 gen_rtx_MINUS (mode,
4055 gen_rtx_ABS (mode, op1),
4056 gen_rtx_ABS (mode, mod))),
4057 gen_rtx_IF_THEN_ELSE
4058 (mode, gen_rtx_GT (BImode,
4059 gen_rtx_DIV (mode, op1, mod),
4060 const0_rtx),
4061 const1_rtx, constm1_rtx),
4062 const0_rtx);
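/* A worked example: for signed 7 / 2 the truncated quotient is 3 and MOD
   is 1.  abs (MOD) = 1 >= abs (OP1) - abs (MOD) = 1 and OP1 / MOD > 0, so
   the adjustment is 1 and 3.5 rounds away from zero to 4; for -7 / 2 the
   adjustment is -1, giving -4.  */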
4065 /* Return the difference between the rounded and the truncated result
4066 of an unsigned division by OP1 with remainder MOD. Halfway cases
4067 are rounded away from zero, rather than to the nearest even
4068 number. */
4069 static rtx
4070 round_udiv_adjust (machine_mode mode, rtx mod, rtx op1)
4072 /* (mod >= op1 - mod ? 1 : 0) */
4073 return gen_rtx_IF_THEN_ELSE
4074 (mode, gen_rtx_GE (BImode, mod,
4075 gen_rtx_MINUS (mode, op1, mod)),
4076 const1_rtx, const0_rtx);
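/* A worked example: for unsigned 5 / 2 the truncated quotient is 2 and
   MOD is 1; MOD >= OP1 - MOD (1 >= 1), so the adjustment is 1 and 2.5
   rounds up to 3.  For 9 / 4, MOD = 1 < OP1 - MOD = 3, so no adjustment
   is made.  */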
4079 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
4080 any rtl. */
4082 static rtx
4083 convert_debug_memory_address (scalar_int_mode mode, rtx x,
4084 addr_space_t as)
4086 #ifndef POINTERS_EXTEND_UNSIGNED
4087 gcc_assert (mode == Pmode
4088 || mode == targetm.addr_space.address_mode (as));
4089 gcc_assert (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode);
4090 #else
4091 rtx temp;
4093 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
4095 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
4096 return x;
4098 /* X must have some form of address mode already. */
4099 scalar_int_mode xmode = as_a <scalar_int_mode> (GET_MODE (x));
4100 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
4101 x = lowpart_subreg (mode, x, xmode);
4102 else if (POINTERS_EXTEND_UNSIGNED > 0)
4103 x = gen_rtx_ZERO_EXTEND (mode, x);
4104 else if (!POINTERS_EXTEND_UNSIGNED)
4105 x = gen_rtx_SIGN_EXTEND (mode, x);
4106 else
4108 switch (GET_CODE (x))
4110 case SUBREG:
4111 if ((SUBREG_PROMOTED_VAR_P (x)
4112 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
4113 || (GET_CODE (SUBREG_REG (x)) == PLUS
4114 && REG_P (XEXP (SUBREG_REG (x), 0))
4115 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
4116 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
4117 && GET_MODE (SUBREG_REG (x)) == mode)
4118 return SUBREG_REG (x);
4119 break;
4120 case LABEL_REF:
4121 temp = gen_rtx_LABEL_REF (mode, label_ref_label (x));
4122 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
4123 return temp;
4124 case SYMBOL_REF:
4125 temp = shallow_copy_rtx (x);
4126 PUT_MODE (temp, mode);
4127 return temp;
4128 case CONST:
4129 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4130 if (temp)
4131 temp = gen_rtx_CONST (mode, temp);
4132 return temp;
4133 case PLUS:
4134 case MINUS:
4135 if (CONST_INT_P (XEXP (x, 1)))
4137 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
4138 if (temp)
4139 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
4141 break;
4142 default:
4143 break;
4145 /* Don't know how to express ptr_extend as an operation in debug info. */
4146 return NULL;
4148 #endif /* POINTERS_EXTEND_UNSIGNED */
4150 return x;
4153 /* Map from SSA_NAMEs to corresponding DEBUG_EXPR_DECLs created
4154 by avoid_deep_ter_for_debug. */
4156 static hash_map<tree, tree> *deep_ter_debug_map;
4158 /* Split too deep TER chains for debug stmts using debug temporaries. */
4160 static void
4161 avoid_deep_ter_for_debug (gimple *stmt, int depth)
4163 use_operand_p use_p;
4164 ssa_op_iter iter;
4165 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
4167 tree use = USE_FROM_PTR (use_p);
4168 if (TREE_CODE (use) != SSA_NAME || SSA_NAME_IS_DEFAULT_DEF (use))
4169 continue;
4170 gimple *g = get_gimple_for_ssa_name (use);
4171 if (g == NULL)
4172 continue;
4173 if (depth > 6 && !stmt_ends_bb_p (g))
4175 if (deep_ter_debug_map == NULL)
4176 deep_ter_debug_map = new hash_map<tree, tree>;
4178 tree &vexpr = deep_ter_debug_map->get_or_insert (use);
4179 if (vexpr != NULL)
4180 continue;
4181 vexpr = make_node (DEBUG_EXPR_DECL);
4182 gimple *def_temp = gimple_build_debug_bind (vexpr, use, g);
4183 DECL_ARTIFICIAL (vexpr) = 1;
4184 TREE_TYPE (vexpr) = TREE_TYPE (use);
4185 SET_DECL_MODE (vexpr, TYPE_MODE (TREE_TYPE (use)));
4186 gimple_stmt_iterator gsi = gsi_for_stmt (g);
4187 gsi_insert_after (&gsi, def_temp, GSI_NEW_STMT);
4188 avoid_deep_ter_for_debug (def_temp, 0);
4190 else
4191 avoid_deep_ter_for_debug (g, depth + 1);
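/* For example, given a hypothetical chain of single-use (TERed) definitions
     _1 = a_2 * 3;  _3 = _1 + 1;  ...  _15 = _14 - 7;
   that feeds a debug bind, the walk above stops substituting once the chain
   is more than six levels deep: the offending SSA name gets a DEBUG_EXPR_DECL
   bound right after its definition, and expand_debug_expr later consults
   deep_ter_debug_map to use that debug temporary instead of expanding the
   whole chain.  */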
4195 /* Return an RTX equivalent to the value of the parameter DECL. */
4197 static rtx
4198 expand_debug_parm_decl (tree decl)
4200 rtx incoming = DECL_INCOMING_RTL (decl);
4202 if (incoming
4203 && GET_MODE (incoming) != BLKmode
4204 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
4205 || (MEM_P (incoming)
4206 && REG_P (XEXP (incoming, 0))
4207 && HARD_REGISTER_P (XEXP (incoming, 0)))))
4209 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
4211 #ifdef HAVE_window_save
4212 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
4213 If the target machine has an explicit window save instruction, the
4214 actual entry value is the corresponding OUTGOING_REGNO instead. */
4215 if (REG_P (incoming)
4216 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
4217 incoming
4218 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
4219 OUTGOING_REGNO (REGNO (incoming)), 0);
4220 else if (MEM_P (incoming))
4222 rtx reg = XEXP (incoming, 0);
4223 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
4225 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
4226 incoming = replace_equiv_address_nv (incoming, reg);
4228 else
4229 incoming = copy_rtx (incoming);
4231 #endif
4233 ENTRY_VALUE_EXP (rtl) = incoming;
4234 return rtl;
4237 if (incoming
4238 && GET_MODE (incoming) != BLKmode
4239 && !TREE_ADDRESSABLE (decl)
4240 && MEM_P (incoming)
4241 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
4242 || (GET_CODE (XEXP (incoming, 0)) == PLUS
4243 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
4244 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
4245 return copy_rtx (incoming);
4247 return NULL_RTX;
4250 /* Return an RTX equivalent to the value of the tree expression EXP. */
4252 static rtx
4253 expand_debug_expr (tree exp)
4255 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
4256 machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
4257 machine_mode inner_mode = VOIDmode;
4258 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
4259 addr_space_t as;
4260 scalar_int_mode op0_mode, op1_mode, addr_mode;
4262 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
4264 case tcc_expression:
4265 switch (TREE_CODE (exp))
4267 case COND_EXPR:
4268 case DOT_PROD_EXPR:
4269 case SAD_EXPR:
4270 case WIDEN_MULT_PLUS_EXPR:
4271 case WIDEN_MULT_MINUS_EXPR:
4272 goto ternary;
4274 case TRUTH_ANDIF_EXPR:
4275 case TRUTH_ORIF_EXPR:
4276 case TRUTH_AND_EXPR:
4277 case TRUTH_OR_EXPR:
4278 case TRUTH_XOR_EXPR:
4279 goto binary;
4281 case TRUTH_NOT_EXPR:
4282 goto unary;
4284 default:
4285 break;
4287 break;
4289 ternary:
4290 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
4291 if (!op2)
4292 return NULL_RTX;
4293 /* Fall through. */
4295 binary:
4296 case tcc_binary:
4297 if (mode == BLKmode)
4298 return NULL_RTX;
4299 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4300 if (!op1)
4301 return NULL_RTX;
4302 switch (TREE_CODE (exp))
4304 case LSHIFT_EXPR:
4305 case RSHIFT_EXPR:
4306 case LROTATE_EXPR:
4307 case RROTATE_EXPR:
4308 case WIDEN_LSHIFT_EXPR:
4309 /* Ensure second operand isn't wider than the first one. */
4310 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 1)));
4311 if (is_a <scalar_int_mode> (inner_mode, &op1_mode)
4312 && (GET_MODE_UNIT_PRECISION (mode)
4313 < GET_MODE_PRECISION (op1_mode)))
4314 op1 = lowpart_subreg (GET_MODE_INNER (mode), op1, op1_mode);
4315 break;
4316 default:
4317 break;
4319 /* Fall through. */
4321 unary:
4322 case tcc_unary:
4323 if (mode == BLKmode)
4324 return NULL_RTX;
4325 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4326 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4327 if (!op0)
4328 return NULL_RTX;
4329 break;
4331 case tcc_comparison:
4332 unsignedp = TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)));
4333 goto binary;
4335 case tcc_type:
4336 case tcc_statement:
4337 gcc_unreachable ();
4339 case tcc_constant:
4340 case tcc_exceptional:
4341 case tcc_declaration:
4342 case tcc_reference:
4343 case tcc_vl_exp:
4344 break;
4347 switch (TREE_CODE (exp))
4349 case STRING_CST:
4350 if (!lookup_constant_def (exp))
4352 if (strlen (TREE_STRING_POINTER (exp)) + 1
4353 != (size_t) TREE_STRING_LENGTH (exp))
4354 return NULL_RTX;
4355 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
4356 op0 = gen_rtx_MEM (BLKmode, op0);
4357 set_mem_attributes (op0, exp, 0);
4358 return op0;
4360 /* Fall through. */
4362 case INTEGER_CST:
4363 case REAL_CST:
4364 case FIXED_CST:
4365 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
4366 return op0;
4368 case POLY_INT_CST:
4369 return immed_wide_int_const (poly_int_cst_value (exp), mode);
4371 case COMPLEX_CST:
4372 gcc_assert (COMPLEX_MODE_P (mode));
4373 op0 = expand_debug_expr (TREE_REALPART (exp));
4374 op1 = expand_debug_expr (TREE_IMAGPART (exp));
4375 return gen_rtx_CONCAT (mode, op0, op1);
4377 case DEBUG_EXPR_DECL:
4378 op0 = DECL_RTL_IF_SET (exp);
4380 if (op0)
4381 return op0;
4383 op0 = gen_rtx_DEBUG_EXPR (mode);
4384 DEBUG_EXPR_TREE_DECL (op0) = exp;
4385 SET_DECL_RTL (exp, op0);
4387 return op0;
4389 case VAR_DECL:
4390 case PARM_DECL:
4391 case FUNCTION_DECL:
4392 case LABEL_DECL:
4393 case CONST_DECL:
4394 case RESULT_DECL:
4395 op0 = DECL_RTL_IF_SET (exp);
4397 /* This decl was probably optimized away. */
4398 if (!op0
4399 /* At least label RTXen are sometimes replaced by
4400 NOTE_INSN_DELETED_LABEL. Any notes here are not
4401 handled by copy_rtx. */
4402 || NOTE_P (op0))
4404 if (!VAR_P (exp)
4405 || DECL_EXTERNAL (exp)
4406 || !TREE_STATIC (exp)
4407 || !DECL_NAME (exp)
4408 || DECL_HARD_REGISTER (exp)
4409 || DECL_IN_CONSTANT_POOL (exp)
4410 || mode == VOIDmode)
4411 return NULL;
4413 op0 = make_decl_rtl_for_debug (exp);
4414 if (!MEM_P (op0)
4415 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
4416 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
4417 return NULL;
4419 else
4420 op0 = copy_rtx (op0);
4422 if (GET_MODE (op0) == BLKmode
4423 /* If op0 is not BLKmode, but mode is, adjust_mode
4424 below would ICE. While it is likely a FE bug,
4425 try to be robust here. See PR43166. */
4426 || mode == BLKmode
4427 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
4429 gcc_assert (MEM_P (op0));
4430 op0 = adjust_address_nv (op0, mode, 0);
4431 return op0;
4434 /* Fall through. */
4436 adjust_mode:
4437 case PAREN_EXPR:
4438 CASE_CONVERT:
4440 inner_mode = GET_MODE (op0);
4442 if (mode == inner_mode)
4443 return op0;
4445 if (inner_mode == VOIDmode)
4447 if (TREE_CODE (exp) == SSA_NAME)
4448 inner_mode = TYPE_MODE (TREE_TYPE (exp));
4449 else
4450 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4451 if (mode == inner_mode)
4452 return op0;
4455 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4457 if (GET_MODE_UNIT_BITSIZE (mode)
4458 == GET_MODE_UNIT_BITSIZE (inner_mode))
4459 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4460 else if (GET_MODE_UNIT_BITSIZE (mode)
4461 < GET_MODE_UNIT_BITSIZE (inner_mode))
4462 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4463 else
4464 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4466 else if (FLOAT_MODE_P (mode))
4468 gcc_assert (TREE_CODE (exp) != SSA_NAME);
4469 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4470 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
4471 else
4472 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
4474 else if (FLOAT_MODE_P (inner_mode))
4476 if (unsignedp)
4477 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4478 else
4479 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4481 else if (GET_MODE_UNIT_PRECISION (mode)
4482 == GET_MODE_UNIT_PRECISION (inner_mode))
4483 op0 = lowpart_subreg (mode, op0, inner_mode);
4484 else if (GET_MODE_UNIT_PRECISION (mode)
4485 < GET_MODE_UNIT_PRECISION (inner_mode))
4486 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
4487 else if (UNARY_CLASS_P (exp)
4488 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
4489 : unsignedp)
4490 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4491 else
4492 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4494 return op0;
4497 case MEM_REF:
4498 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4500 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
4501 TREE_OPERAND (exp, 0),
4502 TREE_OPERAND (exp, 1));
4503 if (newexp)
4504 return expand_debug_expr (newexp);
4506 /* FALLTHROUGH */
4507 case INDIRECT_REF:
4508 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
4509 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4510 if (!op0)
4511 return NULL;
4513 if (TREE_CODE (exp) == MEM_REF)
4515 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4516 || (GET_CODE (op0) == PLUS
4517 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
4518 /* (mem (debug_implicit_ptr)) might confuse aliasing.
4519 Instead just use get_inner_reference. */
4520 goto component_ref;
4522 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
4523 poly_int64 offset;
4524 if (!op1 || !poly_int_rtx_p (op1, &offset))
4525 return NULL;
4527 op0 = plus_constant (inner_mode, op0, offset);
4530 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4532 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4533 op0, as);
4534 if (op0 == NULL_RTX)
4535 return NULL;
4537 op0 = gen_rtx_MEM (mode, op0);
4538 set_mem_attributes (op0, exp, 0);
4539 if (TREE_CODE (exp) == MEM_REF
4540 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
4541 set_mem_expr (op0, NULL_TREE);
4542 set_mem_addr_space (op0, as);
4544 return op0;
4546 case TARGET_MEM_REF:
4547 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
4548 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
4549 return NULL;
4551 op0 = expand_debug_expr
4552 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
4553 if (!op0)
4554 return NULL;
4556 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
4557 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
4558 op0, as);
4559 if (op0 == NULL_RTX)
4560 return NULL;
4562 op0 = gen_rtx_MEM (mode, op0);
4564 set_mem_attributes (op0, exp, 0);
4565 set_mem_addr_space (op0, as);
4567 return op0;
4569 component_ref:
4570 case ARRAY_REF:
4571 case ARRAY_RANGE_REF:
4572 case COMPONENT_REF:
4573 case BIT_FIELD_REF:
4574 case REALPART_EXPR:
4575 case IMAGPART_EXPR:
4576 case VIEW_CONVERT_EXPR:
4578 machine_mode mode1;
4579 poly_int64 bitsize, bitpos;
4580 tree offset;
4581 int reversep, volatilep = 0;
4582 tree tem
4583 = get_inner_reference (exp, &bitsize, &bitpos, &offset, &mode1,
4584 &unsignedp, &reversep, &volatilep);
4585 rtx orig_op0;
4587 if (known_eq (bitsize, 0))
4588 return NULL;
4590 orig_op0 = op0 = expand_debug_expr (tem);
4592 if (!op0)
4593 return NULL;
4595 if (offset)
4597 machine_mode addrmode, offmode;
4599 if (!MEM_P (op0))
4600 return NULL;
4602 op0 = XEXP (op0, 0);
4603 addrmode = GET_MODE (op0);
4604 if (addrmode == VOIDmode)
4605 addrmode = Pmode;
4607 op1 = expand_debug_expr (offset);
4608 if (!op1)
4609 return NULL;
4611 offmode = GET_MODE (op1);
4612 if (offmode == VOIDmode)
4613 offmode = TYPE_MODE (TREE_TYPE (offset));
4615 if (addrmode != offmode)
4616 op1 = lowpart_subreg (addrmode, op1, offmode);
4618 /* Don't use offset_address here, we don't need a
4619 recognizable address, and we don't want to generate
4620 code. */
4621 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4622 op0, op1));
4625 if (MEM_P (op0))
4627 if (mode1 == VOIDmode)
4629 if (maybe_gt (bitsize, MAX_BITSIZE_MODE_ANY_INT))
4630 return NULL;
4631 /* Bitfield. */
4632 mode1 = smallest_int_mode_for_size (bitsize);
4634 poly_int64 bytepos = bits_to_bytes_round_down (bitpos);
4635 if (maybe_ne (bytepos, 0))
4637 op0 = adjust_address_nv (op0, mode1, bytepos);
4638 bitpos = num_trailing_bits (bitpos);
4640 else if (known_eq (bitpos, 0)
4641 && known_eq (bitsize, GET_MODE_BITSIZE (mode)))
4642 op0 = adjust_address_nv (op0, mode, 0);
4643 else if (GET_MODE (op0) != mode1)
4644 op0 = adjust_address_nv (op0, mode1, 0);
4645 else
4646 op0 = copy_rtx (op0);
4647 if (op0 == orig_op0)
4648 op0 = shallow_copy_rtx (op0);
4649 if (TREE_CODE (tem) != SSA_NAME)
4650 set_mem_attributes (op0, exp, 0);
4653 if (known_eq (bitpos, 0) && mode == GET_MODE (op0))
4654 return op0;
4656 if (maybe_lt (bitpos, 0))
4657 return NULL;
4659 if (GET_MODE (op0) == BLKmode || mode == BLKmode)
4660 return NULL;
4662 poly_int64 bytepos;
4663 if (multiple_p (bitpos, BITS_PER_UNIT, &bytepos)
4664 && known_eq (bitsize, GET_MODE_BITSIZE (mode1)))
4666 machine_mode opmode = GET_MODE (op0);
4668 if (opmode == VOIDmode)
4669 opmode = TYPE_MODE (TREE_TYPE (tem));
4671 /* This condition may hold if we're expanding the address
4672 right past the end of an array that turned out not to
4673 be addressable (i.e., the address was only computed in
4674 debug stmts). The gen_subreg below would rightfully
4675 crash, and the address doesn't really exist, so just
4676 drop it. */
4677 if (known_ge (bitpos, GET_MODE_BITSIZE (opmode)))
4678 return NULL;
4680 if (multiple_p (bitpos, GET_MODE_BITSIZE (mode)))
4681 return simplify_gen_subreg (mode, op0, opmode, bytepos);
4684 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4685 && TYPE_UNSIGNED (TREE_TYPE (exp))
4686 ? SIGN_EXTRACT
4687 : ZERO_EXTRACT, mode,
4688 GET_MODE (op0) != VOIDmode
4689 ? GET_MODE (op0)
4690 : TYPE_MODE (TREE_TYPE (tem)),
4691 op0, gen_int_mode (bitsize, word_mode),
4692 gen_int_mode (bitpos, word_mode));
4695 case ABS_EXPR:
4696 case ABSU_EXPR:
4697 return simplify_gen_unary (ABS, mode, op0, mode);
4699 case NEGATE_EXPR:
4700 return simplify_gen_unary (NEG, mode, op0, mode);
4702 case BIT_NOT_EXPR:
4703 return simplify_gen_unary (NOT, mode, op0, mode);
4705 case FLOAT_EXPR:
4706 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4707 0)))
4708 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4709 inner_mode);
4711 case FIX_TRUNC_EXPR:
4712 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4713 inner_mode);
4715 case POINTER_PLUS_EXPR:
4716 /* For the rare target where pointers are not the same size as
4717 size_t, we need to check for mis-matched modes and correct
4718 the addend. */
4719 if (op0 && op1
4720 && is_a <scalar_int_mode> (GET_MODE (op0), &op0_mode)
4721 && is_a <scalar_int_mode> (GET_MODE (op1), &op1_mode)
4722 && op0_mode != op1_mode)
4724 if (GET_MODE_BITSIZE (op0_mode) < GET_MODE_BITSIZE (op1_mode)
4725 /* If OP0 is a partial mode, then we must truncate, even
4726 if it has the same bitsize as OP1 as GCC's
4727 representation of partial modes is opaque. */
4728 || (GET_MODE_CLASS (op0_mode) == MODE_PARTIAL_INT
4729 && (GET_MODE_BITSIZE (op0_mode)
4730 == GET_MODE_BITSIZE (op1_mode))))
4731 op1 = simplify_gen_unary (TRUNCATE, op0_mode, op1, op1_mode);
4732 else
4733 /* We always sign-extend, regardless of the signedness of
4734 the operand, because the operand is always unsigned
4735 here even if the original C expression is signed. */
4736 op1 = simplify_gen_unary (SIGN_EXTEND, op0_mode, op1, op1_mode);
4738 /* Fall through. */
4739 case PLUS_EXPR:
4740 return simplify_gen_binary (PLUS, mode, op0, op1);
4742 case MINUS_EXPR:
4743 case POINTER_DIFF_EXPR:
4744 return simplify_gen_binary (MINUS, mode, op0, op1);
4746 case MULT_EXPR:
4747 return simplify_gen_binary (MULT, mode, op0, op1);
4749 case RDIV_EXPR:
4750 case TRUNC_DIV_EXPR:
4751 case EXACT_DIV_EXPR:
4752 if (unsignedp)
4753 return simplify_gen_binary (UDIV, mode, op0, op1);
4754 else
4755 return simplify_gen_binary (DIV, mode, op0, op1);
4757 case TRUNC_MOD_EXPR:
4758 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4760 case FLOOR_DIV_EXPR:
4761 if (unsignedp)
4762 return simplify_gen_binary (UDIV, mode, op0, op1);
4763 else
4765 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4766 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4767 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4768 return simplify_gen_binary (PLUS, mode, div, adj);
4771 case FLOOR_MOD_EXPR:
4772 if (unsignedp)
4773 return simplify_gen_binary (UMOD, mode, op0, op1);
4774 else
4776 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4777 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4778 adj = simplify_gen_unary (NEG, mode,
4779 simplify_gen_binary (MULT, mode, adj, op1),
4780 mode);
4781 return simplify_gen_binary (PLUS, mode, mod, adj);
4784 case CEIL_DIV_EXPR:
4785 if (unsignedp)
4787 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4788 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4789 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4790 return simplify_gen_binary (PLUS, mode, div, adj);
4792 else
4794 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4795 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4796 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4797 return simplify_gen_binary (PLUS, mode, div, adj);
4800 case CEIL_MOD_EXPR:
4801 if (unsignedp)
4803 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4804 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4805 adj = simplify_gen_unary (NEG, mode,
4806 simplify_gen_binary (MULT, mode, adj, op1),
4807 mode);
4808 return simplify_gen_binary (PLUS, mode, mod, adj);
4810 else
4812 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4813 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4814 adj = simplify_gen_unary (NEG, mode,
4815 simplify_gen_binary (MULT, mode, adj, op1),
4816 mode);
4817 return simplify_gen_binary (PLUS, mode, mod, adj);
4820 case ROUND_DIV_EXPR:
4821 if (unsignedp)
4823 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4824 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4825 rtx adj = round_udiv_adjust (mode, mod, op1);
4826 return simplify_gen_binary (PLUS, mode, div, adj);
4828 else
4830 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4831 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4832 rtx adj = round_sdiv_adjust (mode, mod, op1);
4833 return simplify_gen_binary (PLUS, mode, div, adj);
4836 case ROUND_MOD_EXPR:
4837 if (unsignedp)
4839 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4840 rtx adj = round_udiv_adjust (mode, mod, op1);
4841 adj = simplify_gen_unary (NEG, mode,
4842 simplify_gen_binary (MULT, mode, adj, op1),
4843 mode);
4844 return simplify_gen_binary (PLUS, mode, mod, adj);
4846 else
4848 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4849 rtx adj = round_sdiv_adjust (mode, mod, op1);
4850 adj = simplify_gen_unary (NEG, mode,
4851 simplify_gen_binary (MULT, mode, adj, op1),
4852 mode);
4853 return simplify_gen_binary (PLUS, mode, mod, adj);
4856 case LSHIFT_EXPR:
4857 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4859 case RSHIFT_EXPR:
4860 if (unsignedp)
4861 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4862 else
4863 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4865 case LROTATE_EXPR:
4866 return simplify_gen_binary (ROTATE, mode, op0, op1);
4868 case RROTATE_EXPR:
4869 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4871 case MIN_EXPR:
4872 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4874 case MAX_EXPR:
4875 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4877 case BIT_AND_EXPR:
4878 case TRUTH_AND_EXPR:
4879 return simplify_gen_binary (AND, mode, op0, op1);
4881 case BIT_IOR_EXPR:
4882 case TRUTH_OR_EXPR:
4883 return simplify_gen_binary (IOR, mode, op0, op1);
4885 case BIT_XOR_EXPR:
4886 case TRUTH_XOR_EXPR:
4887 return simplify_gen_binary (XOR, mode, op0, op1);
4889 case TRUTH_ANDIF_EXPR:
4890 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4892 case TRUTH_ORIF_EXPR:
4893 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4895 case TRUTH_NOT_EXPR:
4896 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4898 case LT_EXPR:
4899 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4900 op0, op1);
4902 case LE_EXPR:
4903 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4904 op0, op1);
4906 case GT_EXPR:
4907 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4908 op0, op1);
4910 case GE_EXPR:
4911 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4912 op0, op1);
4914 case EQ_EXPR:
4915 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4917 case NE_EXPR:
4918 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4920 case UNORDERED_EXPR:
4921 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4923 case ORDERED_EXPR:
4924 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4926 case UNLT_EXPR:
4927 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4929 case UNLE_EXPR:
4930 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4932 case UNGT_EXPR:
4933 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4935 case UNGE_EXPR:
4936 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4938 case UNEQ_EXPR:
4939 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4941 case LTGT_EXPR:
4942 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4944 case COND_EXPR:
4945 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4947 case COMPLEX_EXPR:
4948 gcc_assert (COMPLEX_MODE_P (mode));
4949 if (GET_MODE (op0) == VOIDmode)
4950 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4951 if (GET_MODE (op1) == VOIDmode)
4952 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4953 return gen_rtx_CONCAT (mode, op0, op1);
4955 case CONJ_EXPR:
4956 if (GET_CODE (op0) == CONCAT)
4957 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4958 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4959 XEXP (op0, 1),
4960 GET_MODE_INNER (mode)));
4961 else
4963 scalar_mode imode = GET_MODE_INNER (mode);
4964 rtx re, im;
4966 if (MEM_P (op0))
4968 re = adjust_address_nv (op0, imode, 0);
4969 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4971 else
4973 scalar_int_mode ifmode;
4974 scalar_int_mode ihmode;
4975 rtx halfsize;
4976 if (!int_mode_for_mode (mode).exists (&ifmode)
4977 || !int_mode_for_mode (imode).exists (&ihmode))
4978 return NULL;
4979 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4980 re = op0;
4981 if (mode != ifmode)
4982 re = gen_rtx_SUBREG (ifmode, re, 0);
4983 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4984 if (imode != ihmode)
4985 re = gen_rtx_SUBREG (imode, re, 0);
4986 im = copy_rtx (op0);
4987 if (mode != ifmode)
4988 im = gen_rtx_SUBREG (ifmode, im, 0);
4989 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4990 if (imode != ihmode)
4991 im = gen_rtx_SUBREG (imode, im, 0);
4993 im = gen_rtx_NEG (imode, im);
4994 return gen_rtx_CONCAT (mode, re, im);
4997 case ADDR_EXPR:
4998 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4999 if (!op0 || !MEM_P (op0))
5001 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
5002 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
5003 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
5004 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
5005 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
5006 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
5008 if (handled_component_p (TREE_OPERAND (exp, 0)))
5010 poly_int64 bitoffset, bitsize, maxsize, byteoffset;
5011 bool reverse;
5012 tree decl
5013 = get_ref_base_and_extent (TREE_OPERAND (exp, 0), &bitoffset,
5014 &bitsize, &maxsize, &reverse);
5015 if ((VAR_P (decl)
5016 || TREE_CODE (decl) == PARM_DECL
5017 || TREE_CODE (decl) == RESULT_DECL)
5018 && (!TREE_ADDRESSABLE (decl)
5019 || target_for_debug_bind (decl))
5020 && multiple_p (bitoffset, BITS_PER_UNIT, &byteoffset)
5021 && known_gt (bitsize, 0)
5022 && known_eq (bitsize, maxsize))
5024 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
5025 return plus_constant (mode, base, byteoffset);
5029 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
5030 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
5031 == ADDR_EXPR)
5033 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5034 0));
5035 if (op0 != NULL
5036 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
5037 || (GET_CODE (op0) == PLUS
5038 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
5039 && CONST_INT_P (XEXP (op0, 1)))))
5041 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
5042 1));
5043 poly_int64 offset;
5044 if (!op1 || !poly_int_rtx_p (op1, &offset))
5045 return NULL;
5047 return plus_constant (mode, op0, offset);
5051 return NULL;
5054 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
5055 addr_mode = SCALAR_INT_TYPE_MODE (TREE_TYPE (exp));
5056 op0 = convert_debug_memory_address (addr_mode, XEXP (op0, 0), as);
5058 return op0;
5060 case VECTOR_CST:
5062 unsigned HOST_WIDE_INT i, nelts;
5064 if (!VECTOR_CST_NELTS (exp).is_constant (&nelts))
5065 return NULL;
5067 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5069 for (i = 0; i < nelts; ++i)
5071 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
5072 if (!op1)
5073 return NULL;
5074 XVECEXP (op0, 0, i) = op1;
5077 return op0;
5080 case CONSTRUCTOR:
5081 if (TREE_CLOBBER_P (exp))
5082 return NULL;
5083 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
5085 unsigned i;
5086 unsigned HOST_WIDE_INT nelts;
5087 tree val;
5089 if (!TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)).is_constant (&nelts))
5090 goto flag_unsupported;
5092 op0 = gen_rtx_CONCATN (mode, rtvec_alloc (nelts));
5094 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
5096 op1 = expand_debug_expr (val);
5097 if (!op1)
5098 return NULL;
5099 XVECEXP (op0, 0, i) = op1;
5102 if (i < nelts)
5104 op1 = expand_debug_expr
5105 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
5107 if (!op1)
5108 return NULL;
5110 for (; i < nelts; i++)
5111 XVECEXP (op0, 0, i) = op1;
5114 return op0;
5116 else
5117 goto flag_unsupported;
5119 case CALL_EXPR:
5120 /* ??? Maybe handle some builtins? */
5121 return NULL;
5123 case SSA_NAME:
5125 gimple *g = get_gimple_for_ssa_name (exp);
5126 if (g)
5128 tree t = NULL_TREE;
5129 if (deep_ter_debug_map)
5131 tree *slot = deep_ter_debug_map->get (exp);
5132 if (slot)
5133 t = *slot;
5135 if (t == NULL_TREE)
5136 t = gimple_assign_rhs_to_tree (g);
5137 op0 = expand_debug_expr (t);
5138 if (!op0)
5139 return NULL;
5141 else
5143 /* If this is a reference to an incoming value of
5144 a parameter that is never used in the code or where the
5145 incoming value is never used in the code, use
5146 PARM_DECL's DECL_RTL if set. */
5147 if (SSA_NAME_IS_DEFAULT_DEF (exp)
5148 && SSA_NAME_VAR (exp)
5149 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL
5150 && has_zero_uses (exp))
5152 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
5153 if (op0)
5154 goto adjust_mode;
5155 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
5156 if (op0)
5157 goto adjust_mode;
5160 int part = var_to_partition (SA.map, exp);
5162 if (part == NO_PARTITION)
5163 return NULL;
5165 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
5167 op0 = copy_rtx (SA.partition_to_pseudo[part]);
5169 goto adjust_mode;
5172 case ERROR_MARK:
5173 return NULL;
5175 /* Vector stuff. For most of these tree codes we don't have RTL codes. */
5176 case REALIGN_LOAD_EXPR:
5177 case VEC_COND_EXPR:
5178 case VEC_PACK_FIX_TRUNC_EXPR:
5179 case VEC_PACK_FLOAT_EXPR:
5180 case VEC_PACK_SAT_EXPR:
5181 case VEC_PACK_TRUNC_EXPR:
5182 case VEC_UNPACK_FIX_TRUNC_HI_EXPR:
5183 case VEC_UNPACK_FIX_TRUNC_LO_EXPR:
5184 case VEC_UNPACK_FLOAT_HI_EXPR:
5185 case VEC_UNPACK_FLOAT_LO_EXPR:
5186 case VEC_UNPACK_HI_EXPR:
5187 case VEC_UNPACK_LO_EXPR:
5188 case VEC_WIDEN_MULT_HI_EXPR:
5189 case VEC_WIDEN_MULT_LO_EXPR:
5190 case VEC_WIDEN_MULT_EVEN_EXPR:
5191 case VEC_WIDEN_MULT_ODD_EXPR:
5192 case VEC_WIDEN_LSHIFT_HI_EXPR:
5193 case VEC_WIDEN_LSHIFT_LO_EXPR:
5194 case VEC_PERM_EXPR:
5195 case VEC_DUPLICATE_EXPR:
5196 case VEC_SERIES_EXPR:
5197 case SAD_EXPR:
5198 return NULL;
5200 /* Misc codes. */
5201 case ADDR_SPACE_CONVERT_EXPR:
5202 case FIXED_CONVERT_EXPR:
5203 case OBJ_TYPE_REF:
5204 case WITH_SIZE_EXPR:
5205 case BIT_INSERT_EXPR:
5206 return NULL;
5208 case DOT_PROD_EXPR:
5209 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5210 && SCALAR_INT_MODE_P (mode))
5213 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5214 0)))
5215 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5216 inner_mode);
5218 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5219 1)))
5220 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
5221 inner_mode);
5222 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5223 return simplify_gen_binary (PLUS, mode, op0, op2);
5225 return NULL;
5227 case WIDEN_MULT_EXPR:
5228 case WIDEN_MULT_PLUS_EXPR:
5229 case WIDEN_MULT_MINUS_EXPR:
5230 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5231 && SCALAR_INT_MODE_P (mode))
5233 inner_mode = GET_MODE (op0);
5234 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
5235 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5236 else
5237 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5238 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
5239 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
5240 else
5241 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
5242 op0 = simplify_gen_binary (MULT, mode, op0, op1);
5243 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
5244 return op0;
5245 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
5246 return simplify_gen_binary (PLUS, mode, op0, op2);
5247 else
5248 return simplify_gen_binary (MINUS, mode, op2, op0);
5250 return NULL;
5252 case MULT_HIGHPART_EXPR:
5253 /* ??? Similar to the above. */
5254 return NULL;
5256 case WIDEN_SUM_EXPR:
5257 case WIDEN_LSHIFT_EXPR:
5258 if (SCALAR_INT_MODE_P (GET_MODE (op0))
5259 && SCALAR_INT_MODE_P (mode))
5262 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
5263 0)))
5264 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
5265 inner_mode);
5266 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
5267 ? ASHIFT : PLUS, mode, op0, op1);
5269 return NULL;
5271 default:
5272 flag_unsupported:
5273 if (flag_checking)
5275 debug_tree (exp);
5276 gcc_unreachable ();
5278 return NULL;
5282 /* Return an RTX equivalent to the source bind value of the tree expression
5283 EXP. */
5285 static rtx
5286 expand_debug_source_expr (tree exp)
5288 rtx op0 = NULL_RTX;
5289 machine_mode mode = VOIDmode, inner_mode;
5291 switch (TREE_CODE (exp))
5293 case VAR_DECL:
5294 if (DECL_ABSTRACT_ORIGIN (exp))
5295 return expand_debug_source_expr (DECL_ABSTRACT_ORIGIN (exp));
5296 break;
5297 case PARM_DECL:
5299 mode = DECL_MODE (exp);
5300 op0 = expand_debug_parm_decl (exp);
5301 if (op0)
5302 break;
5303 /* Check whether this is an argument that has been completely
5304 optimized out. */
5305 if (!DECL_RTL_SET_P (exp)
5306 && !DECL_INCOMING_RTL (exp)
5307 && DECL_ABSTRACT_ORIGIN (current_function_decl))
5309 tree aexp = DECL_ORIGIN (exp);
5310 if (DECL_CONTEXT (aexp)
5311 == DECL_ABSTRACT_ORIGIN (current_function_decl))
5313 vec<tree, va_gc> **debug_args;
5314 unsigned int ix;
5315 tree ddecl;
5316 debug_args = decl_debug_args_lookup (current_function_decl);
5317 if (debug_args != NULL)
5319 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
5320 ix += 2)
5321 if (ddecl == aexp)
5322 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
5326 break;
5328 default:
5329 break;
5332 if (op0 == NULL_RTX)
5333 return NULL_RTX;
5335 inner_mode = GET_MODE (op0);
5336 if (mode == inner_mode)
5337 return op0;
5339 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
5341 if (GET_MODE_UNIT_BITSIZE (mode)
5342 == GET_MODE_UNIT_BITSIZE (inner_mode))
5343 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
5344 else if (GET_MODE_UNIT_BITSIZE (mode)
5345 < GET_MODE_UNIT_BITSIZE (inner_mode))
5346 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
5347 else
5348 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
5350 else if (FLOAT_MODE_P (mode))
5351 gcc_unreachable ();
5352 else if (FLOAT_MODE_P (inner_mode))
5354 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5355 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
5356 else
5357 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
5359 else if (GET_MODE_UNIT_PRECISION (mode)
5360 == GET_MODE_UNIT_PRECISION (inner_mode))
5361 op0 = lowpart_subreg (mode, op0, inner_mode);
5362 else if (GET_MODE_UNIT_PRECISION (mode)
5363 < GET_MODE_UNIT_PRECISION (inner_mode))
5364 op0 = simplify_gen_unary (TRUNCATE, mode, op0, inner_mode);
5365 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
5366 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
5367 else
5368 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
5370 return op0;
5373 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbounded complexity.
5374 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
5375 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
5377 static void
5378 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
5380 rtx exp = *exp_p;
5382 if (exp == NULL_RTX)
5383 return;
5385 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
5386 return;
5388 if (depth == 4)
5390 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
5391 rtx dval = make_debug_expr_from_rtl (exp);
5393 /* Emit a debug bind insn before INSN. */
5394 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
5395 DEBUG_EXPR_TREE_DECL (dval), exp,
5396 VAR_INIT_STATUS_INITIALIZED);
5398 emit_debug_insn_before (bind, insn);
5399 *exp_p = dval;
5400 return;
5403 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
5404 int i, j;
5405 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
5406 switch (*format_ptr++)
5408 case 'e':
5409 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
5410 break;
5412 case 'E':
5413 case 'V':
5414 for (j = 0; j < XVECLEN (exp, i); j++)
5415 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
5416 break;
5418 default:
5419 break;
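/* Concretely: when walking the location of a debug bind insn, plain objects
   such as registers and constants are left alone, but any other subexpression
   (MEMs included) reached at nesting depth 4 is pulled out into a fresh
   DEBUG_EXPR, a debug bind for it is emitted before INSN, and the original
   location then refers to that DEBUG_EXPR.  */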
5423 /* Expand the _LOCs in debug insns. We run this after expanding all
5424 regular insns, so that any variables referenced in the function
5425 will have their DECL_RTLs set. */
5427 static void
5428 expand_debug_locations (void)
5430 rtx_insn *insn;
5431 rtx_insn *last = get_last_insn ();
5432 int save_strict_alias = flag_strict_aliasing;
5434 /* Creating new alias sets while setting up memory attributes causes
5435 -fcompare-debug failures, even though it doesn't bring about any
5436 codegen changes. */
5437 flag_strict_aliasing = 0;
5439 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
5440 if (DEBUG_BIND_INSN_P (insn))
5442 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
5443 rtx val;
5444 rtx_insn *prev_insn, *insn2;
5445 machine_mode mode;
5447 if (value == NULL_TREE)
5448 val = NULL_RTX;
5449 else
5451 if (INSN_VAR_LOCATION_STATUS (insn)
5452 == VAR_INIT_STATUS_UNINITIALIZED)
5453 val = expand_debug_source_expr (value);
5454 /* The avoid_deep_ter_for_debug function inserts
5455 debug bind stmts after SSA_NAME definition, with the
5456 SSA_NAME as the whole bind location. Temporarily disable
5457 expansion of that SSA_NAME into the DEBUG_EXPR_DECL
5458 being defined in this DEBUG_INSN. */
5459 else if (deep_ter_debug_map && TREE_CODE (value) == SSA_NAME)
5461 tree *slot = deep_ter_debug_map->get (value);
5462 if (slot)
5464 if (*slot == INSN_VAR_LOCATION_DECL (insn))
5465 *slot = NULL_TREE;
5466 else
5467 slot = NULL;
5469 val = expand_debug_expr (value);
5470 if (slot)
5471 *slot = INSN_VAR_LOCATION_DECL (insn);
5473 else
5474 val = expand_debug_expr (value);
5475 gcc_assert (last == get_last_insn ());
5478 if (!val)
5479 val = gen_rtx_UNKNOWN_VAR_LOC ();
5480 else
5482 mode = GET_MODE (INSN_VAR_LOCATION (insn));
5484 gcc_assert (mode == GET_MODE (val)
5485 || (GET_MODE (val) == VOIDmode
5486 && (CONST_SCALAR_INT_P (val)
5487 || GET_CODE (val) == CONST_FIXED
5488 || GET_CODE (val) == LABEL_REF)));
5491 INSN_VAR_LOCATION_LOC (insn) = val;
5492 prev_insn = PREV_INSN (insn);
5493 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
5494 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
5497 flag_strict_aliasing = save_strict_alias;
5500 /* Swap the operands of commutative operations so that the more
5501 expensive one is expanded first. */
5503 static void
5504 reorder_operands (basic_block bb)
5506 unsigned int *lattice; /* Hold cost of each statement. */
5507 unsigned int i = 0, n = 0;
5508 gimple_stmt_iterator gsi;
5509 gimple_seq stmts;
5510 gimple *stmt;
5511 bool swap;
5512 tree op0, op1;
5513 ssa_op_iter iter;
5514 use_operand_p use_p;
5515 gimple *def0, *def1;
5517 /* Compute cost of each statement using estimate_num_insns. */
5518 stmts = bb_seq (bb);
5519 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5521 stmt = gsi_stmt (gsi);
5522 if (!is_gimple_debug (stmt))
5523 gimple_set_uid (stmt, n++);
5525 lattice = XNEWVEC (unsigned int, n);
5526 for (gsi = gsi_start (stmts); !gsi_end_p (gsi); gsi_next (&gsi))
5528 unsigned cost;
5529 stmt = gsi_stmt (gsi);
5530 if (is_gimple_debug (stmt))
5531 continue;
5532 cost = estimate_num_insns (stmt, &eni_size_weights);
5533 lattice[i] = cost;
5534 FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter, SSA_OP_USE)
5536 tree use = USE_FROM_PTR (use_p);
5537 gimple *def_stmt;
5538 if (TREE_CODE (use) != SSA_NAME)
5539 continue;
5540 def_stmt = get_gimple_for_ssa_name (use);
5541 if (!def_stmt)
5542 continue;
5543 lattice[i] += lattice[gimple_uid (def_stmt)];
5545 i++;
5546 if (!is_gimple_assign (stmt)
5547 || !commutative_tree_code (gimple_assign_rhs_code (stmt)))
5548 continue;
5549 op0 = gimple_op (stmt, 1);
5550 op1 = gimple_op (stmt, 2);
5551 if (TREE_CODE (op0) != SSA_NAME
5552 || TREE_CODE (op1) != SSA_NAME)
5553 continue;
5554 /* Swap operands if the second one is more expensive. */
5555 def0 = get_gimple_for_ssa_name (op0);
5556 def1 = get_gimple_for_ssa_name (op1);
5557 if (!def1)
5558 continue;
5559 swap = false;
5560 if (!def0 || lattice[gimple_uid (def1)] > lattice[gimple_uid (def0)])
5561 swap = true;
5562 if (swap)
5564 if (dump_file && (dump_flags & TDF_DETAILS))
5566 fprintf (dump_file, "Swap operands in stmt:\n");
5567 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
5568 fprintf (dump_file, "Cost left opnd=%d, right opnd=%d\n",
5569 def0 ? lattice[gimple_uid (def0)] : 0,
5570 lattice[gimple_uid (def1)]);
5572 swap_ssa_operands (stmt, gimple_assign_rhs1_ptr (stmt),
5573 gimple_assign_rhs2_ptr (stmt));
5576 XDELETE (lattice);
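/* For example, for a hypothetical statement x_5 = a_1 + b_2 where b_2 is
   defined by a costlier chain of (TERed) statements than a_1, the operands
   are swapped so that the more expensive b_2 is expanded first.  */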
5579 /* Expand basic block BB from GIMPLE trees to RTL. */
5581 static basic_block
5582 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
5584 gimple_stmt_iterator gsi;
5585 gimple_seq stmts;
5586 gimple *stmt = NULL;
5587 rtx_note *note = NULL;
5588 rtx_insn *last;
5589 edge e;
5590 edge_iterator ei;
5592 if (dump_file)
5593 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
5594 bb->index);
5596 /* Note that since we are now transitioning from GIMPLE to RTL, we
5597 cannot use the gsi_*_bb() routines because they expect the basic
5598 block to be in GIMPLE, instead of RTL. Therefore, we need to
5599 access the BB sequence directly. */
5600 if (optimize)
5601 reorder_operands (bb);
5602 stmts = bb_seq (bb);
5603 bb->il.gimple.seq = NULL;
5604 bb->il.gimple.phi_nodes = NULL;
5605 rtl_profile_for_bb (bb);
5606 init_rtl_bb_info (bb);
5607 bb->flags |= BB_RTL;
5609 /* Remove the RETURN_EXPR if we may fall through to the exit
5610 instead. */
5611 gsi = gsi_last (stmts);
5612 if (!gsi_end_p (gsi)
5613 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
5615 greturn *ret_stmt = as_a <greturn *> (gsi_stmt (gsi));
5617 gcc_assert (single_succ_p (bb));
5618 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
5620 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
5621 && !gimple_return_retval (ret_stmt))
5623 gsi_remove (&gsi, false);
5624 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
5628 gsi = gsi_start (stmts);
5629 if (!gsi_end_p (gsi))
5631 stmt = gsi_stmt (gsi);
5632 if (gimple_code (stmt) != GIMPLE_LABEL)
5633 stmt = NULL;
5636 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
5638 if (stmt || elt)
5640 gcc_checking_assert (!note);
5641 last = get_last_insn ();
5643 if (stmt)
5645 expand_gimple_stmt (stmt);
5646 gsi_next (&gsi);
5649 if (elt)
5650 emit_label (*elt);
5652 BB_HEAD (bb) = NEXT_INSN (last);
5653 if (NOTE_P (BB_HEAD (bb)))
5654 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
5655 gcc_assert (LABEL_P (BB_HEAD (bb)));
5656 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
5658 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5660 else
5661 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
5663 if (note)
5664 NOTE_BASIC_BLOCK (note) = bb;
5666 for (; !gsi_end_p (gsi); gsi_next (&gsi))
5668 basic_block new_bb;
5670 stmt = gsi_stmt (gsi);
5672 /* If this statement is a non-debug one, and we generate debug
5673 insns, then this one might be the last real use of a TERed
5674 SSA_NAME, but where there are still some debug uses further
5675 down. Expanding the current SSA name in such further debug
5676 uses by their RHS might lead to wrong debug info, as coalescing
5677 might make the operands of such RHS be placed into the same
5678 pseudo as something else. Like so:
5679 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
5680 use(a_1);
5681 a_2 = ...
5682 #DEBUG ... => a_1
5683 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
5684 If we were now to expand a_1 by its RHS (a_0 + 1) in the debug use,
5685 the write to a_2 would actually have clobbered the place which
5686 formerly held a_0.
5688 So, instead of that, we recognize the situation, and generate
5689 debug temporaries at the last real use of TERed SSA names:
5690 a_1 = a_0 + 1;
5691 #DEBUG #D1 => a_1
5692 use(a_1);
5693 a_2 = ...
5694 #DEBUG ... => #D1
5696 if (MAY_HAVE_DEBUG_BIND_INSNS
5697 && SA.values
5698 && !is_gimple_debug (stmt))
5700 ssa_op_iter iter;
5701 tree op;
5702 gimple *def;
5704 location_t sloc = curr_insn_location ();
5706 /* Look for SSA names that have their last use here (TERed
5707 names always have only one real use). */
5708 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5709 if ((def = get_gimple_for_ssa_name (op)))
5711 imm_use_iterator imm_iter;
5712 use_operand_p use_p;
5713 bool have_debug_uses = false;
5715 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5717 if (gimple_debug_bind_p (USE_STMT (use_p)))
5719 have_debug_uses = true;
5720 break;
5724 if (have_debug_uses)
5726 /* OP is a TERed SSA name, with DEF its defining
5727 statement, and where OP is used in further debug
5728 instructions. Generate a debug temporary, and
5729 replace all uses of OP in debug insns with that
5730 temporary. */
5731 gimple *debugstmt;
5732 tree value = gimple_assign_rhs_to_tree (def);
5733 tree vexpr = make_node (DEBUG_EXPR_DECL);
5734 rtx val;
5735 machine_mode mode;
5737 set_curr_insn_location (gimple_location (def));
5739 DECL_ARTIFICIAL (vexpr) = 1;
5740 TREE_TYPE (vexpr) = TREE_TYPE (value);
5741 if (DECL_P (value))
5742 mode = DECL_MODE (value);
5743 else
5744 mode = TYPE_MODE (TREE_TYPE (value));
5745 SET_DECL_MODE (vexpr, mode);
5747 val = gen_rtx_VAR_LOCATION
5748 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5750 emit_debug_insn (val);
5752 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5754 if (!gimple_debug_bind_p (debugstmt))
5755 continue;
5757 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5758 SET_USE (use_p, vexpr);
5760 update_stmt (debugstmt);
5764 set_curr_insn_location (sloc);
5767 currently_expanding_gimple_stmt = stmt;
5769 /* Expand this statement, then evaluate the resulting RTL and
5770 fixup the CFG accordingly. */
5771 if (gimple_code (stmt) == GIMPLE_COND)
5773 new_bb = expand_gimple_cond (bb, as_a <gcond *> (stmt));
5774 if (new_bb)
5775 return new_bb;
5777 else if (is_gimple_debug (stmt))
5779 location_t sloc = curr_insn_location ();
5780 gimple_stmt_iterator nsi = gsi;
5782 for (;;)
5784 tree var;
5785 tree value = NULL_TREE;
5786 rtx val = NULL_RTX;
5787 machine_mode mode;
5789 if (!gimple_debug_nonbind_marker_p (stmt))
5791 if (gimple_debug_bind_p (stmt))
5793 var = gimple_debug_bind_get_var (stmt);
5795 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5796 && TREE_CODE (var) != LABEL_DECL
5797 && !target_for_debug_bind (var))
5798 goto delink_debug_stmt;
5800 if (DECL_P (var))
5801 mode = DECL_MODE (var);
5802 else
5803 mode = TYPE_MODE (TREE_TYPE (var));
5805 if (gimple_debug_bind_has_value_p (stmt))
5806 value = gimple_debug_bind_get_value (stmt);
5808 val = gen_rtx_VAR_LOCATION
5809 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5811 else if (gimple_debug_source_bind_p (stmt))
5813 var = gimple_debug_source_bind_get_var (stmt);
5815 value = gimple_debug_source_bind_get_value (stmt);
5817 mode = DECL_MODE (var);
5819 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5820 VAR_INIT_STATUS_UNINITIALIZED);
5822 else
5823 gcc_unreachable ();
5825 /* If this function was first compiled with markers
5826 enabled, but they're now disabled (e.g. LTO), drop
5827 them on the floor. */
5828 else if (gimple_debug_nonbind_marker_p (stmt)
5829 && !MAY_HAVE_DEBUG_MARKER_INSNS)
5830 goto delink_debug_stmt;
5831 else if (gimple_debug_begin_stmt_p (stmt))
5832 val = GEN_RTX_DEBUG_MARKER_BEGIN_STMT_PAT ();
5833 else if (gimple_debug_inline_entry_p (stmt))
5835 tree block = gimple_block (stmt);
5837 if (block)
5838 val = GEN_RTX_DEBUG_MARKER_INLINE_ENTRY_PAT ();
5839 else
5840 goto delink_debug_stmt;
5842 else
5843 gcc_unreachable ();
5845 last = get_last_insn ();
5847 set_curr_insn_location (gimple_location (stmt));
5849 emit_debug_insn (val);
5851 if (dump_file && (dump_flags & TDF_DETAILS))
5853 /* We can't dump the insn with a TREE where an RTX
5854 is expected. */
5855 if (GET_CODE (val) == VAR_LOCATION)
5857 gcc_checking_assert (PAT_VAR_LOCATION_LOC (val) == (rtx)value);
5858 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5860 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5861 if (GET_CODE (val) == VAR_LOCATION)
5862 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5865 delink_debug_stmt:
5866 /* In order not to generate too many debug temporaries,
5867 we delink all uses of debug statements we already expanded.
5868 Therefore debug statements between definition and real
5869 use of TERed SSA names will continue to use the SSA name,
5870 and not be replaced with debug temps. */
5871 delink_stmt_imm_use (stmt);
5873 gsi = nsi;
5874 gsi_next (&nsi);
5875 if (gsi_end_p (nsi))
5876 break;
5877 stmt = gsi_stmt (nsi);
5878 if (!is_gimple_debug (stmt))
5879 break;
5882 set_curr_insn_location (sloc);
5884 else
5886 gcall *call_stmt = dyn_cast <gcall *> (stmt);
5887 if (call_stmt
5888 && gimple_call_tail_p (call_stmt)
5889 && disable_tail_calls)
5890 gimple_call_set_tail (call_stmt, false);
5892 if (call_stmt && gimple_call_tail_p (call_stmt))
5894 bool can_fallthru;
5895 new_bb = expand_gimple_tailcall (bb, call_stmt, &can_fallthru);
5896 if (new_bb)
5898 if (can_fallthru)
5899 bb = new_bb;
5900 else
5901 return new_bb;
5904 else
5906 def_operand_p def_p;
5907 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5909 if (def_p != NULL)
5911 /* Ignore this stmt if it is in the list of
5912 replaceable expressions. */
5913 if (SA.values
5914 && bitmap_bit_p (SA.values,
5915 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5916 continue;
5918 last = expand_gimple_stmt (stmt);
5919 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5924 currently_expanding_gimple_stmt = NULL;
5926 /* Expand implicit goto and convert goto_locus. */
5927 FOR_EACH_EDGE (e, ei, bb->succs)
5929 if (e->goto_locus != UNKNOWN_LOCATION)
5930 set_curr_insn_location (e->goto_locus);
5931 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5933 emit_jump (label_rtx_for_bb (e->dest));
5934 e->flags &= ~EDGE_FALLTHRU;
5938 /* Expanded RTL can create a jump in the last instruction of a block.
5939 Such a jump might later be assumed to be a jump to the successor and break edge insertion.
5940 We need to insert a dummy move to prevent this. PR41440. */
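/* A sketch of the resulting insn stream (illustrative only):
     ... (jump_insn ...)                          ;; emitted by the expansion above
     (insn (set (reg:SI dummy) (reg:SI dummy)))   ;; no-op move appended below
   so BB_END (bb) is no longer a jump and instructions inserted on the
   fallthru edge have a safe place to land.  */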
5941 if (single_succ_p (bb)
5942 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5943 && (last = get_last_insn ())
5944 && (JUMP_P (last)
5945 || (DEBUG_INSN_P (last)
5946 && JUMP_P (prev_nondebug_insn (last)))))
5948 rtx dummy = gen_reg_rtx (SImode);
5949 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5952 do_pending_stack_adjust ();
5954 /* Find the block tail. The last insn in the block is the insn
5955 before a barrier and/or table jump insn. */
5956 last = get_last_insn ();
5957 if (BARRIER_P (last))
5958 last = PREV_INSN (last);
5959 if (JUMP_TABLE_DATA_P (last))
5960 last = PREV_INSN (PREV_INSN (last));
5961 if (BARRIER_P (last))
5962 last = PREV_INSN (last);
5963 BB_END (bb) = last;
5965 update_bb_for_insn (bb);
5967 return bb;
5971 /* Create a basic block for initialization code. */
5973 static basic_block
5974 construct_init_block (void)
5976 basic_block init_block, first_block;
5977 edge e = NULL;
5978 int flags;
5980 /* Multiple entry points not supported yet. */
5981 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5982 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5983 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5984 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5985 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5987 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5989 /* When the entry edge points to the first basic block, we don't need a jump;
5990 otherwise we have to jump to the proper target. */
5991 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5993 tree label = gimple_block_label (e->dest);
5995 emit_jump (jump_target_rtx (label));
5996 flags = 0;
5998 else
5999 flags = EDGE_FALLTHRU;
6001 init_block = create_basic_block (NEXT_INSN (get_insns ()),
6002 get_last_insn (),
6003 ENTRY_BLOCK_PTR_FOR_FN (cfun));
6004 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
6005 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6006 if (e)
6008 first_block = e->dest;
6009 redirect_edge_succ (e, init_block);
6010 make_single_succ_edge (init_block, first_block, flags);
6012 else
6013 make_single_succ_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6014 EDGE_FALLTHRU);
6016 update_bb_for_insn (init_block);
6017 return init_block;
6020 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
6021 found in the block tree. */
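/* An illustrative sketch (not from the sources): for a block tree
     outermost block          -> BLOCK_NUMBER 0
       sibling blocks B1, B2  -> BLOCK_NUMBER 1
         block nested in B1   -> BLOCK_NUMBER 2
   siblings reached through BLOCK_CHAIN share a level, and each step
   into BLOCK_SUBBLOCKS adds one.  */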
6023 static void
6024 set_block_levels (tree block, int level)
6026 while (block)
6028 BLOCK_NUMBER (block) = level;
6029 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
6030 block = BLOCK_CHAIN (block);
6034 /* Create a block containing landing pads and similar stuff. */
6036 static void
6037 construct_exit_block (void)
6039 rtx_insn *head = get_last_insn ();
6040 rtx_insn *end;
6041 basic_block exit_block;
6042 edge e, e2;
6043 unsigned ix;
6044 edge_iterator ei;
6045 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
6046 rtx_insn *orig_end = BB_END (prev_bb);
6048 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
6050 /* Make sure the locus is set to the end of the function, so that
6051 epilogue line numbers and warnings are set properly. */
6052 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
6053 input_location = cfun->function_end_locus;
6055 /* Generate rtl for function exit. */
6056 expand_function_end ();
6058 end = get_last_insn ();
6059 if (head == end)
6060 return;
6061 /* While emitting the function end we could move the end of the last basic
6062 block. */
6063 BB_END (prev_bb) = orig_end;
6064 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
6065 head = NEXT_INSN (head);
6066 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
6067 bb counting will be confused. Any instructions before that
6068 label are emitted for the case where PREV_BB falls through into the
6069 exit block, so append those instructions to prev_bb in that case. */
6070 if (NEXT_INSN (head) != return_label)
6072 while (NEXT_INSN (head) != return_label)
6074 if (!NOTE_P (NEXT_INSN (head)))
6075 BB_END (prev_bb) = NEXT_INSN (head);
6076 head = NEXT_INSN (head);
6079 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
6080 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
6081 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
6083 ix = 0;
6084 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
6086 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
6087 if (!(e->flags & EDGE_ABNORMAL))
6088 redirect_edge_succ (e, exit_block);
6089 else
6090 ix++;
6093 e = make_single_succ_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun),
6094 EDGE_FALLTHRU);
6095 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
6096 if (e2 != e)
6098 exit_block->count -= e2->count ();
6100 update_bb_for_insn (exit_block);
6103 /* Helper function for discover_nonconstant_array_refs.
6104 Look for ARRAY_REF nodes with non-constant indexes and mark them
6105 addressable. */
6107 static tree
6108 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
6109 void *data ATTRIBUTE_UNUSED)
6111 tree t = *tp;
6113 if (IS_TYPE_OR_DECL_P (t))
6114 *walk_subtrees = 0;
6115 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6117 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6118 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
6119 && (!TREE_OPERAND (t, 2)
6120 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6121 || (TREE_CODE (t) == COMPONENT_REF
6122 && (!TREE_OPERAND (t, 2)
6123 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
6124 || TREE_CODE (t) == BIT_FIELD_REF
6125 || TREE_CODE (t) == REALPART_EXPR
6126 || TREE_CODE (t) == IMAGPART_EXPR
6127 || TREE_CODE (t) == VIEW_CONVERT_EXPR
6128 || CONVERT_EXPR_P (t))
6129 t = TREE_OPERAND (t, 0);
6131 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
6133 t = get_base_address (t);
6134 if (t && DECL_P (t)
6135 && DECL_MODE (t) != BLKmode)
6136 TREE_ADDRESSABLE (t) = 1;
6139 *walk_subtrees = 0;
6141 /* References of size POLY_INT_CST to a fixed-size object must go
6142 through memory. It's more efficient to force that here than
6143 to create temporary slots on the fly. */
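/* For example (an assumed illustration, e.g. on an SVE target): reading a
   scalable-vector value out of a fixed-size local that could otherwise be
   expanded to a register must instead go through a memory slot, so the
   base declaration is marked addressable below.  */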
6144 else if ((TREE_CODE (t) == MEM_REF || TREE_CODE (t) == TARGET_MEM_REF)
6145 && TYPE_SIZE (TREE_TYPE (t))
6146 && POLY_INT_CST_P (TYPE_SIZE (TREE_TYPE (t))))
6148 tree base = get_base_address (t);
6149 if (base
6150 && DECL_P (base)
6151 && DECL_MODE (base) != BLKmode
6152 && GET_MODE_SIZE (DECL_MODE (base)).is_constant ())
6153 TREE_ADDRESSABLE (base) = 1;
6154 *walk_subtrees = 0;
6157 return NULL_TREE;
6160 /* If there's a chance to get a pseudo for T, and T would be of a float mode
6161 while the actual access is via an integer mode (a lowered memcpy or similar
6162 access), avoid the register expansion when that float mode is likely not
6163 suitable for raw-bit processing (like XFmode on i?86). */
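/* An illustrative case (assumed, not from the testsuite):

     long double d = ...;
     unsigned char buf[sizeof d];
     __builtin_memcpy (buf, &d, sizeof d);

   where the memcpy may be lowered to a single integer-mode access.
   If D were given an XFmode pseudo, that integer-mode access could not
   reliably read all of its storage bytes, so D is forced into memory by
   marking it TREE_ADDRESSABLE below.  */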
6165 static void
6166 avoid_type_punning_on_regs (tree t)
6168 machine_mode access_mode = TYPE_MODE (TREE_TYPE (t));
6169 if (access_mode != BLKmode
6170 && !SCALAR_INT_MODE_P (access_mode))
6171 return;
6172 tree base = get_base_address (t);
6173 if (DECL_P (base)
6174 && !TREE_ADDRESSABLE (base)
6175 && FLOAT_MODE_P (DECL_MODE (base))
6176 && maybe_lt (GET_MODE_PRECISION (DECL_MODE (base)),
6177 GET_MODE_BITSIZE (GET_MODE_INNER (DECL_MODE (base))))
6178 /* Double check in the expensive way we really would get a pseudo. */
6179 && use_register_for_decl (base))
6180 TREE_ADDRESSABLE (base) = 1;
6183 /* RTL expansion is not able to compile array references with variable
6184 offsets for arrays stored in a single register. Discover such
6185 expressions and mark the variables as addressable to avoid this
6186 scenario. */
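/* An illustrative sketch (assumed, not from the testsuite):

     int f (int i)
     {
       int a[2] = { 1, 2 };
       return a[i];
     }

   A is small and never has its address taken, so it could be expanded
   into a single (e.g. DImode) register; the variable index I cannot be
   applied to a register, so A is marked TREE_ADDRESSABLE and kept in
   memory instead.  */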
6188 static void
6189 discover_nonconstant_array_refs (void)
6191 basic_block bb;
6192 gimple_stmt_iterator gsi;
6194 FOR_EACH_BB_FN (bb, cfun)
6195 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6197 gimple *stmt = gsi_stmt (gsi);
6198 if (!is_gimple_debug (stmt))
6200 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
6201 gcall *call = dyn_cast <gcall *> (stmt);
6202 if (call && gimple_call_internal_p (call))
6203 switch (gimple_call_internal_fn (call))
6205 case IFN_LOAD_LANES:
6206 /* The source must be a MEM. */
6207 mark_addressable (gimple_call_arg (call, 0));
6208 break;
6209 case IFN_STORE_LANES:
6210 /* The destination must be a MEM. */
6211 mark_addressable (gimple_call_lhs (call));
6212 break;
6213 default:
6214 break;
6216 if (gimple_vdef (stmt))
6218 tree t = gimple_get_lhs (stmt);
6219 if (t && REFERENCE_CLASS_P (t))
6220 avoid_type_punning_on_regs (t);
6226 /* This function sets crtl->args.internal_arg_pointer to a virtual
6227 register if DRAP is needed. The local register allocator will replace
6228 virtual_incoming_args_rtx with the virtual register. */
6230 static void
6231 expand_stack_alignment (void)
6233 rtx drap_rtx;
6234 unsigned int preferred_stack_boundary;
6236 if (! SUPPORTS_STACK_ALIGNMENT)
6237 return;
6239 if (cfun->calls_alloca
6240 || cfun->has_nonlocal_label
6241 || crtl->has_nonlocal_goto)
6242 crtl->need_drap = true;
6244 /* Call update_stack_boundary here again to update incoming stack
6245 boundary. It may set incoming stack alignment to a different
6246 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
6247 use the minimum incoming stack alignment to check if it is OK
6248 to perform sibcall optimization since sibcall optimization will
6249 only align the outgoing stack to incoming stack boundary. */
6250 if (targetm.calls.update_stack_boundary)
6251 targetm.calls.update_stack_boundary ();
6253 /* The incoming stack frame has to be aligned at least at
6254 parm_stack_boundary. */
6255 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
6257 /* Update crtl->stack_alignment_estimated and use it later to align
6258 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
6259 exceptions since callgraph doesn't collect incoming stack alignment
6260 in this case. */
6261 if (cfun->can_throw_non_call_exceptions
6262 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
6263 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
6264 else
6265 preferred_stack_boundary = crtl->preferred_stack_boundary;
6266 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
6267 crtl->stack_alignment_estimated = preferred_stack_boundary;
6268 if (preferred_stack_boundary > crtl->stack_alignment_needed)
6269 crtl->stack_alignment_needed = preferred_stack_boundary;
6271 gcc_assert (crtl->stack_alignment_needed
6272 <= crtl->stack_alignment_estimated);
6274 crtl->stack_realign_needed
6275 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
6276 crtl->stack_realign_tried = crtl->stack_realign_needed;
6278 crtl->stack_realign_processed = true;
6280 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
6281 alignment. */
6282 gcc_assert (targetm.calls.get_drap_rtx != NULL);
6283 drap_rtx = targetm.calls.get_drap_rtx ();
6285 /* stack_realign_drap and drap_rtx must match. */
6286 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
6288 /* Do nothing if NULL is returned, which means DRAP is not needed. */
6289 if (drap_rtx != NULL)
6291 crtl->args.internal_arg_pointer = drap_rtx;
6293 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
6294 needed. */
6295 fixup_tail_calls ();
6300 static void
6301 expand_main_function (void)
6303 #if (defined(INVOKE__main) \
6304 || (!defined(HAS_INIT_SECTION) \
6305 && !defined(INIT_SECTION_ASM_OP) \
6306 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
6307 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode);
6308 #endif
6312 /* Expand code to initialize the stack_protect_guard. This is invoked at
6313 the beginning of a function to be protected. */
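/* Conceptually (a simplified sketch) the code emitted here amounts to

     <canary slot in this frame> = <guard value>;

   where the guard value is typically __stack_chk_guard or a TLS slot,
   depending on the target, and the copy is done via the combined
   address+set pattern, the plain stack_protect_set pattern, or a
   straight move, in that order of preference.  */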
6315 static void
6316 stack_protect_prologue (void)
6318 tree guard_decl = targetm.stack_protect_guard ();
6319 rtx x, y;
6321 crtl->stack_protect_guard_decl = guard_decl;
6322 x = expand_normal (crtl->stack_protect_guard);
6324 if (targetm.have_stack_protect_combined_set () && guard_decl)
6326 gcc_assert (DECL_P (guard_decl));
6327 y = DECL_RTL (guard_decl);
6329 /* Allow the target to compute the address of Y and copy it to X without
6330 leaking Y into a register. This combined address + copy pattern
6331 allows the target to prevent spilling of any intermediate results by
6332 splitting it after register allocation. */
6333 if (rtx_insn *insn = targetm.gen_stack_protect_combined_set (x, y))
6335 emit_insn (insn);
6336 return;
6340 if (guard_decl)
6341 y = expand_normal (guard_decl);
6342 else
6343 y = const0_rtx;
6345 /* Allow the target to copy from Y to X without leaking Y into a
6346 register. */
6347 if (targetm.have_stack_protect_set ())
6348 if (rtx_insn *insn = targetm.gen_stack_protect_set (x, y))
6350 emit_insn (insn);
6351 return;
6354 /* Otherwise do a straight move. */
6355 emit_move_insn (x, y);
6358 /* Translate the intermediate representation contained in the CFG
6359 from GIMPLE trees to RTL.
6361 We do conversion per basic block and preserve/update the tree CFG.
6362 This implies we have to do some magic as the CFG can simultaneously
6363 consist of basic blocks containing RTL and GIMPLE trees. This can
6364 confuse the CFG hooks, so be careful to not manipulate CFG during
6365 the expansion. */
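/* An illustrative sketch (not from the sources) of the transformation
   performed for a single statement: a GIMPLE assignment such as

     a_2 = b_1 + 4;

   is, after out-of-SSA coalescing has mapped SSA partitions to pseudos,
   expanded into RTL along the lines of

     (set (reg:SI 92 [ a ]) (plus:SI (reg:SI 91 [ b ]) (const_int 4)))

   one basic block at a time, switching each block from GIMPLE to RTL as
   it is processed.  */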
6367 namespace {
6369 const pass_data pass_data_expand =
6371 RTL_PASS, /* type */
6372 "expand", /* name */
6373 OPTGROUP_NONE, /* optinfo_flags */
6374 TV_EXPAND, /* tv_id */
6375 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
6376 | PROP_gimple_lcx
6377 | PROP_gimple_lvec
6378 | PROP_gimple_lva), /* properties_required */
6379 PROP_rtl, /* properties_provided */
6380 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
6381 0, /* todo_flags_start */
6382 0, /* todo_flags_finish */
6385 class pass_expand : public rtl_opt_pass
6387 public:
6388 pass_expand (gcc::context *ctxt)
6389 : rtl_opt_pass (pass_data_expand, ctxt)
6392 /* opt_pass methods: */
6393 virtual unsigned int execute (function *);
6395 }; // class pass_expand
6397 unsigned int
6398 pass_expand::execute (function *fun)
6400 basic_block bb, init_block;
6401 edge_iterator ei;
6402 edge e;
6403 rtx_insn *var_seq, *var_ret_seq;
6404 unsigned i;
6406 timevar_push (TV_OUT_OF_SSA);
6407 rewrite_out_of_ssa (&SA);
6408 timevar_pop (TV_OUT_OF_SSA);
6409 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
6411 if (MAY_HAVE_DEBUG_BIND_STMTS && flag_tree_ter)
6413 gimple_stmt_iterator gsi;
6414 FOR_EACH_BB_FN (bb, cfun)
6415 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
6416 if (gimple_debug_bind_p (gsi_stmt (gsi)))
6417 avoid_deep_ter_for_debug (gsi_stmt (gsi), 0);
6420 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
6421 discover_nonconstant_array_refs ();
6423 /* Make sure all values used by the optimization passes have sane
6424 defaults. */
6425 reg_renumber = 0;
6427 /* Some backends want to know that we are expanding to RTL. */
6428 currently_expanding_to_rtl = 1;
6429 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
6430 free_dominance_info (CDI_DOMINATORS);
6432 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
6434 insn_locations_init ();
6435 if (!DECL_IS_UNDECLARED_BUILTIN (current_function_decl))
6437 /* Eventually, all FEs should explicitly set function_start_locus. */
6438 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
6439 set_curr_insn_location
6440 (DECL_SOURCE_LOCATION (current_function_decl));
6441 else
6442 set_curr_insn_location (fun->function_start_locus);
6444 else
6445 set_curr_insn_location (UNKNOWN_LOCATION);
6446 prologue_location = curr_insn_location ();
6448 #ifdef INSN_SCHEDULING
6449 init_sched_attrs ();
6450 #endif
6452 /* Make sure first insn is a note even if we don't want linenums.
6453 This makes sure the first insn will never be deleted.
6454 Also, final expects a note to appear there. */
6455 emit_note (NOTE_INSN_DELETED);
6457 targetm.expand_to_rtl_hook ();
6458 crtl->init_stack_alignment ();
6459 fun->cfg->max_jumptable_ents = 0;
6461 /* Resolve the function section. Some targets, like ARM EABI, rely on knowledge
6462 of the function section at expansion time to predict the distance of calls. */
6463 resolve_unique_section (current_function_decl, 0, flag_function_sections);
6465 /* Expand the variables recorded during gimple lowering. */
6466 timevar_push (TV_VAR_EXPAND);
6467 start_sequence ();
6469 var_ret_seq = expand_used_vars ();
6471 var_seq = get_insns ();
6472 end_sequence ();
6473 timevar_pop (TV_VAR_EXPAND);
6475 /* Honor stack protection warnings. */
6476 if (warn_stack_protect)
6478 if (fun->calls_alloca)
6479 warning (OPT_Wstack_protector,
6480 "stack protector not protecting local variables: "
6481 "variable length buffer");
6482 if (has_short_buffer && !crtl->stack_protect_guard)
6483 warning (OPT_Wstack_protector,
6484 "stack protector not protecting function: "
6485 "all local arrays are less than %d bytes long",
6486 (int) param_ssp_buffer_size);
6489 /* Set up parameters and prepare for return, for the function. */
6490 expand_function_start (current_function_decl);
6492 /* If we emitted any instructions for setting up the variables,
6493 emit them before the FUNCTION_START note. */
6494 if (var_seq)
6496 emit_insn_before (var_seq, parm_birth_insn);
6498 /* In expand_function_end we'll insert the alloca save/restore
6499 before parm_birth_insn. We've just inserted an alloca call.
6500 Adjust the pointer to match. */
6501 parm_birth_insn = var_seq;
6504 /* Now propagate the RTL assignment of each partition to the
6505 underlying var of each SSA_NAME. */
6506 tree name;
6508 FOR_EACH_SSA_NAME (i, name, cfun)
6510 /* We might have generated new SSA names in
6511 update_alias_info_with_stack_vars. They will have a NULL
6512 defining statement and won't be part of the partitioning,
6513 so ignore those. */
6514 if (!SSA_NAME_DEF_STMT (name))
6515 continue;
6517 adjust_one_expanded_partition_var (name);
6520 /* Clean up RTL of variables that straddle across multiple
6521 partitions, and check that the rtl of any PARM_DECLs that are not
6522 cleaned up is that of their default defs. */
6523 FOR_EACH_SSA_NAME (i, name, cfun)
6525 int part;
6527 /* We might have generated new SSA names in
6528 update_alias_info_with_stack_vars. They will have a NULL
6529 defining statement and won't be part of the partitioning,
6530 so ignore those. */
6531 if (!SSA_NAME_DEF_STMT (name))
6532 continue;
6533 part = var_to_partition (SA.map, name);
6534 if (part == NO_PARTITION)
6535 continue;
6537 /* If this decl was marked as living in multiple places, reset
6538 this now to NULL. */
6539 tree var = SSA_NAME_VAR (name);
6540 if (var && DECL_RTL_IF_SET (var) == pc_rtx)
6541 SET_DECL_RTL (var, NULL);
6542 /* Check that the pseudos chosen by assign_parms are those of
6543 the corresponding default defs. */
6544 else if (SSA_NAME_IS_DEFAULT_DEF (name)
6545 && (TREE_CODE (var) == PARM_DECL
6546 || TREE_CODE (var) == RESULT_DECL))
6548 rtx in = DECL_RTL_IF_SET (var);
6549 gcc_assert (in);
6550 rtx out = SA.partition_to_pseudo[part];
6551 gcc_assert (in == out);
6553 /* Now reset VAR's RTL to IN, so that the _EXPR attrs match
6554 those expected by debug backends for each parm and for
6555 the result. This is particularly important for stabs,
6556 whose register elimination from parm's DECL_RTL may cause
6557 -fcompare-debug differences as SET_DECL_RTL changes reg's
6558 attrs. So, make sure the RTL already has the parm as the
6559 EXPR, so that it won't change. */
6560 SET_DECL_RTL (var, NULL_RTX);
6561 if (MEM_P (in))
6562 set_mem_attributes (in, var, true);
6563 SET_DECL_RTL (var, in);
6567 /* If this function is `main', emit a call to `__main'
6568 to run global initializers, etc. */
6569 if (DECL_NAME (current_function_decl)
6570 && MAIN_NAME_P (DECL_NAME (current_function_decl))
6571 && DECL_FILE_SCOPE_P (current_function_decl))
6572 expand_main_function ();
6574 /* Initialize the stack_protect_guard field. This must happen after the
6575 call to __main (if any) so that the external decl is initialized. */
6576 if (crtl->stack_protect_guard && targetm.stack_protect_runtime_enabled_p ())
6577 stack_protect_prologue ();
6579 expand_phi_nodes (&SA);
6581 /* Release any stale SSA redirection data. */
6582 redirect_edge_var_map_empty ();
6584 /* Register rtl specific functions for cfg. */
6585 rtl_register_cfg_hooks ();
6587 init_block = construct_init_block ();
6589 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
6590 remaining edges later. */
6591 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
6592 e->flags &= ~EDGE_EXECUTABLE;
6594 /* If the function has too many markers, drop them while expanding. */
6595 if (cfun->debug_marker_count
6596 >= param_max_debug_marker_count)
6597 cfun->debug_nonbind_markers = false;
6599 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
6600 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
6601 next_bb)
6602 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
6604 if (MAY_HAVE_DEBUG_BIND_INSNS)
6605 expand_debug_locations ();
6607 if (deep_ter_debug_map)
6609 delete deep_ter_debug_map;
6610 deep_ter_debug_map = NULL;
6613 /* Free stuff we no longer need after GIMPLE optimizations. */
6614 free_dominance_info (CDI_DOMINATORS);
6615 free_dominance_info (CDI_POST_DOMINATORS);
6616 delete_tree_cfg_annotations (fun);
6618 timevar_push (TV_OUT_OF_SSA);
6619 finish_out_of_ssa (&SA);
6620 timevar_pop (TV_OUT_OF_SSA);
6622 timevar_push (TV_POST_EXPAND);
6623 /* We are no longer in SSA form. */
6624 fun->gimple_df->in_ssa_p = false;
6625 loops_state_clear (LOOP_CLOSED_SSA);
6627 /* Expansion is used by optimization passes too; set maybe_hot_insn_p
6628 conservatively to true until they are all profile aware. */
6629 delete lab_rtx_for_bb;
6630 free_histograms (fun);
6632 construct_exit_block ();
6633 insn_locations_finalize ();
6635 if (var_ret_seq)
6637 rtx_insn *after = return_label;
6638 rtx_insn *next = NEXT_INSN (after);
6639 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
6640 after = next;
6641 emit_insn_after (var_ret_seq, after);
6644 /* Zap the tree EH table. */
6645 set_eh_throw_stmt_table (fun, NULL);
6647 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
6648 split edges which edge insertions might do. */
6649 rebuild_jump_labels (get_insns ());
6651 /* If we have a single successor to the entry block, put the pending insns
6652 after parm birth, but before NOTE_INSN_FUNCTION_BEG. */
6653 if (single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
6655 edge e = single_succ_edge (ENTRY_BLOCK_PTR_FOR_FN (fun));
6656 if (e->insns.r)
6658 rtx_insn *insns = e->insns.r;
6659 e->insns.r = NULL;
6660 rebuild_jump_labels_chain (insns);
6661 if (NOTE_P (parm_birth_insn)
6662 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
6663 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
6664 else
6665 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
6669 /* Otherwise, as well as for other edges, take the usual way. */
6670 commit_edge_insertions ();
6672 /* We're done expanding trees to RTL. */
6673 currently_expanding_to_rtl = 0;
6675 flush_mark_addressable_queue ();
6677 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
6678 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
6680 edge e;
6681 edge_iterator ei;
6682 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
6684 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
6685 e->flags &= ~EDGE_EXECUTABLE;
6687 /* At the moment not all abnormal edges match the RTL
6688 representation. It is safe to remove them here as
6689 find_many_sub_basic_blocks will rediscover them.
6690 In the future we should get this fixed properly. */
6691 if ((e->flags & EDGE_ABNORMAL)
6692 && !(e->flags & EDGE_SIBCALL))
6693 remove_edge (e);
6694 else
6695 ei_next (&ei);
6699 auto_sbitmap blocks (last_basic_block_for_fn (fun));
6700 bitmap_ones (blocks);
6701 find_many_sub_basic_blocks (blocks);
6702 purge_all_dead_edges ();
6704 /* After initial rtl generation, call back to finish generating
6705 exception support code. We need to do this before cleaning up
6706 the CFG as the code does not expect dead landing pads. */
6707 if (fun->eh->region_tree != NULL)
6708 finish_eh_generation ();
6710 /* Call expand_stack_alignment after finishing all
6711 updates to crtl->preferred_stack_boundary. */
6712 expand_stack_alignment ();
6714 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
6715 function. */
6716 if (crtl->tail_call_emit)
6717 fixup_tail_calls ();
6719 unsigned HOST_WIDE_INT patch_area_size = function_entry_patch_area_size;
6720 unsigned HOST_WIDE_INT patch_area_entry = function_entry_patch_area_start;
6722 tree patchable_function_entry_attr
6723 = lookup_attribute ("patchable_function_entry",
6724 DECL_ATTRIBUTES (cfun->decl));
6725 if (patchable_function_entry_attr)
6727 tree pp_val = TREE_VALUE (patchable_function_entry_attr);
6728 tree patchable_function_entry_value1 = TREE_VALUE (pp_val);
6730 patch_area_size = tree_to_uhwi (patchable_function_entry_value1);
6731 patch_area_entry = 0;
6732 if (TREE_CHAIN (pp_val) != NULL_TREE)
6734 tree patchable_function_entry_value2
6735 = TREE_VALUE (TREE_CHAIN (pp_val));
6736 patch_area_entry = tree_to_uhwi (patchable_function_entry_value2);
6740 if (patch_area_entry > patch_area_size)
6742 if (patch_area_size > 0)
6743 warning (OPT_Wattributes,
6744 "patchable function entry %wu exceeds size %wu",
6745 patch_area_entry, patch_area_size);
6746 patch_area_entry = 0;
6749 crtl->patch_area_size = patch_area_size;
6750 crtl->patch_area_entry = patch_area_entry;
6752 /* BB subdivision may have created basic blocks that are only reachable
6753 from unlikely bbs but not marked as such in the profile. */
6754 if (optimize)
6755 propagate_unlikely_bbs_forward ();
6757 /* Remove unreachable blocks, otherwise we cannot compute dominators
6758 which are needed for loop state verification. As a side-effect
6759 this also compacts blocks.
6760 ??? We cannot remove trivially dead insns here as for example
6761 the DRAP reg on i?86 is not magically live at this point.
6762 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
6763 cleanup_cfg (CLEANUP_NO_INSN_DEL);
6765 checking_verify_flow_info ();
6767 /* Initialize pseudos allocated for hard registers. */
6768 emit_initial_value_sets ();
6770 /* And finally unshare all RTL. */
6771 unshare_all_rtl ();
6773 /* There's no need to defer outputting this function any more; we
6774 know we want to output it. */
6775 DECL_DEFER_OUTPUT (current_function_decl) = 0;
6777 /* Now that we're done expanding trees to RTL, we shouldn't have any
6778 more CONCATs anywhere. */
6779 generating_concat_p = 0;
6781 if (dump_file)
6783 fprintf (dump_file,
6784 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
6785 /* And the pass manager will dump RTL for us. */
6788 /* If we're emitting a nested function, make sure its parent gets
6789 emitted as well. Doing otherwise confuses debug info. */
6791 tree parent;
6792 for (parent = DECL_CONTEXT (current_function_decl);
6793 parent != NULL_TREE;
6794 parent = get_containing_scope (parent))
6795 if (TREE_CODE (parent) == FUNCTION_DECL)
6796 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
6799 TREE_ASM_WRITTEN (current_function_decl) = 1;
6801 /* After expanding, the return labels are no longer needed. */
6802 return_label = NULL;
6803 naked_return_label = NULL;
6805 /* After expanding, the tm_restart map is no longer needed. */
6806 if (fun->gimple_df->tm_restart)
6807 fun->gimple_df->tm_restart = NULL;
6809 /* Tag the blocks with a depth number so that change_scope can find
6810 the common parent easily. */
6811 set_block_levels (DECL_INITIAL (fun->decl), 0);
6812 default_rtl_profile ();
6814 /* For -dx discard loops now, otherwise IL verify in clean_state will
6815 ICE. */
6816 if (rtl_dump_and_exit)
6818 cfun->curr_properties &= ~PROP_loops;
6819 loop_optimizer_finalize ();
6822 timevar_pop (TV_POST_EXPAND);
6824 return 0;
6827 } // anon namespace
6829 rtl_opt_pass *
6830 make_pass_expand (gcc::context *ctxt)
6832 return new pass_expand (ctxt);