IPA ICF, part 4/5
[official-gcc.git] / gcc / cfgexpand.c
blob5cb96df037fb3b2ef8ecdb1385d416e986e3953a
1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004-2014 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GCC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "rtl.h"
25 #include "hard-reg-set.h"
26 #include "tree.h"
27 #include "stringpool.h"
28 #include "varasm.h"
29 #include "stor-layout.h"
30 #include "stmt.h"
31 #include "print-tree.h"
32 #include "tm_p.h"
33 #include "basic-block.h"
34 #include "function.h"
35 #include "expr.h"
36 #include "langhooks.h"
37 #include "bitmap.h"
38 #include "hash-set.h"
39 #include "tree-ssa-alias.h"
40 #include "internal-fn.h"
41 #include "tree-eh.h"
42 #include "gimple-expr.h"
43 #include "is-a.h"
44 #include "gimple.h"
45 #include "gimple-iterator.h"
46 #include "gimple-walk.h"
47 #include "gimple-ssa.h"
48 #include "cgraph.h"
49 #include "tree-cfg.h"
50 #include "tree-phinodes.h"
51 #include "ssa-iterators.h"
52 #include "tree-ssanames.h"
53 #include "tree-dfa.h"
54 #include "tree-ssa.h"
55 #include "tree-pass.h"
56 #include "except.h"
57 #include "flags.h"
58 #include "diagnostic.h"
59 #include "gimple-pretty-print.h"
60 #include "toplev.h"
61 #include "debug.h"
62 #include "params.h"
63 #include "tree-inline.h"
64 #include "value-prof.h"
65 #include "target.h"
66 #include "tree-ssa-live.h"
67 #include "tree-outof-ssa.h"
68 #include "sbitmap.h"
69 #include "cfgloop.h"
70 #include "regs.h" /* For reg_renumber. */
71 #include "insn-attr.h" /* For INSN_SCHEDULING. */
72 #include "asan.h"
73 #include "tree-ssa-address.h"
74 #include "recog.h"
75 #include "output.h"
76 #include "builtins.h"
78 /* Some systems use __main in a way incompatible with its use in gcc, in these
79 cases use the macros NAME__MAIN to give a quoted symbol and SYMBOL__MAIN to
80 give the same symbol without quotes for an alternative entry point. You
81 must define both, or neither. */
82 #ifndef NAME__MAIN
83 #define NAME__MAIN "__main"
84 #endif
86 /* This variable holds information helping the rewriting of SSA trees
87 into RTL. */
88 struct ssaexpand SA;
90 /* This variable holds the currently expanded gimple statement for purposes
91 of communicating the profile info to the builtin expanders. */
92 gimple currently_expanding_gimple_stmt;
/* Forward declaration; the definition is not part of this section. */
94 static rtx expand_debug_expr (tree);
96 /* Return an expression tree corresponding to the RHS of GIMPLE
97 statement STMT. */
99 tree
100 gimple_assign_rhs_to_tree (gimple stmt)
102 tree t;
103 enum gimple_rhs_class grhs_class;
105 grhs_class = get_gimple_rhs_class (gimple_expr_code (stmt));
107 if (grhs_class == GIMPLE_TERNARY_RHS)
108 t = build3 (gimple_assign_rhs_code (stmt),
109 TREE_TYPE (gimple_assign_lhs (stmt)),
110 gimple_assign_rhs1 (stmt),
111 gimple_assign_rhs2 (stmt),
112 gimple_assign_rhs3 (stmt));
113 else if (grhs_class == GIMPLE_BINARY_RHS)
114 t = build2 (gimple_assign_rhs_code (stmt),
115 TREE_TYPE (gimple_assign_lhs (stmt)),
116 gimple_assign_rhs1 (stmt),
117 gimple_assign_rhs2 (stmt));
118 else if (grhs_class == GIMPLE_UNARY_RHS)
119 t = build1 (gimple_assign_rhs_code (stmt),
120 TREE_TYPE (gimple_assign_lhs (stmt)),
121 gimple_assign_rhs1 (stmt));
122 else if (grhs_class == GIMPLE_SINGLE_RHS)
124 t = gimple_assign_rhs1 (stmt);
125 /* Avoid modifying this tree in place below. */
126 if ((gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t)
127 && gimple_location (stmt) != EXPR_LOCATION (t))
128 || (gimple_block (stmt)
129 && currently_expanding_to_rtl
130 && EXPR_P (t)))
131 t = copy_node (t);
133 else
134 gcc_unreachable ();
136 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (t))
137 SET_EXPR_LOCATION (t, gimple_location (stmt));
139 return t;
/* Default STACK_ALIGNMENT_NEEDED to 1 when nothing defined it earlier. */
143 #ifndef STACK_ALIGNMENT_NEEDED
144 #define STACK_ALIGNMENT_NEEDED 1
145 #endif
/* Yield SSA_NAME_VAR (X) when X is an SSA name and X itself otherwise.
   The argument is not parenthesized in the expansion and appears more
   than once, so pass only simple, side-effect-free expressions. */
147 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
149 /* Associate declaration T with storage space X. If T is no
150 SSA name this is exactly SET_DECL_RTL, otherwise make the
151 partition of T associated with X. */
152 static inline void
153 set_rtl (tree t, rtx x)
155 if (TREE_CODE (t) == SSA_NAME)
157 SA.partition_to_pseudo[var_to_partition (SA.map, t)] = x;
158 if (x && !MEM_P (x))
159 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (t), x);
160 /* For the benefit of debug information at -O0 (where vartracking
161 doesn't run) record the place also in the base DECL if it's
162 a normal variable (not a parameter). */
163 if (x && x != pc_rtx && TREE_CODE (SSA_NAME_VAR (t)) == VAR_DECL)
165 tree var = SSA_NAME_VAR (t);
166 /* If we don't yet have something recorded, just record it now. */
167 if (!DECL_RTL_SET_P (var))
168 SET_DECL_RTL (var, x);
169 /* If we have it set already to "multiple places" don't
170 change this. */
171 else if (DECL_RTL (var) == pc_rtx)
173 /* If we have something recorded and it's not the same place
174 as we want to record now, we have multiple partitions for the
175 same base variable, with different places. We can't just
176 randomly chose one, hence we have to say that we don't know.
177 This only happens with optimization, and there var-tracking
178 will figure out the right thing. */
179 else if (DECL_RTL (var) != x)
180 SET_DECL_RTL (var, pc_rtx);
183 else
184 SET_DECL_RTL (t, x);
187 /* This structure holds data relevant to one variable that will be
188 placed in a stack slot. */
189 struct stack_var
191 /* The Variable. */
192 tree decl;
194 /* Initially, the size of the variable. Later, the size of the partition,
195 if this variable becomes it's partition's representative. */
196 HOST_WIDE_INT size;
198 /* The *byte* alignment required for this variable. Or as, with the
199 size, the alignment for this partition. */
200 unsigned int alignb;
202 /* The partition representative. */
203 size_t representative;
205 /* The next stack variable in the partition, or EOC. */
206 size_t next;
208 /* The numbers of conflicting stack variables. */
209 bitmap conflicts;
/* Sentinel stored in stack_var::next to terminate a partition's member
   chain. */
212 #define EOC ((size_t)-1)
214 /* We have an array of such objects while deciding allocation. */
215 static struct stack_var *stack_vars;
216 static size_t stack_vars_alloc;
217 static size_t stack_vars_num;
218 static hash_map<tree, size_t> *decl_to_stack_part;
220 /* Conflict bitmaps go on this obstack. This allows us to destroy
221 all of them in one big sweep. */
222 static bitmap_obstack stack_var_bitmap_obstack;
224 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
225 is non-decreasing. */
226 static size_t *stack_vars_sorted;
228 /* The phase of the stack frame. This is the known misalignment of
229 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
230 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
231 static int frame_phase;
233 /* Used during expand_used_vars to remember if we saw any decls for
234 which we'd like to enable stack smashing protection. */
235 static bool has_protected_decls;
237 /* Used during expand_used_vars. Remember if we saw a character buffer
238 smaller than our cutoff threshold. Used for -Wstack-protector. */
239 static bool has_short_buffer;
241 /* Compute the byte alignment to use for DECL. Ignore alignment
242 we can't do with expected alignment of the stack boundary. */
244 static unsigned int
245 align_local_variable (tree decl)
247 unsigned int align = LOCAL_DECL_ALIGNMENT (decl);
248 DECL_ALIGN (decl) = align;
249 return align / BITS_PER_UNIT;
252 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
253 Return the frame offset. */
255 static HOST_WIDE_INT
256 alloc_stack_frame_space (HOST_WIDE_INT size, unsigned HOST_WIDE_INT align)
258 HOST_WIDE_INT offset, new_frame_offset;
260 new_frame_offset = frame_offset;
261 if (FRAME_GROWS_DOWNWARD)
263 new_frame_offset -= size + frame_phase;
264 new_frame_offset &= -align;
265 new_frame_offset += frame_phase;
266 offset = new_frame_offset;
268 else
270 new_frame_offset -= frame_phase;
271 new_frame_offset += align - 1;
272 new_frame_offset &= -align;
273 new_frame_offset += frame_phase;
274 offset = new_frame_offset;
275 new_frame_offset += size;
277 frame_offset = new_frame_offset;
279 if (frame_offset_overflow (frame_offset, cfun->decl))
280 frame_offset = offset = 0;
282 return offset;
285 /* Accumulate DECL into STACK_VARS. */
287 static void
288 add_stack_var (tree decl)
290 struct stack_var *v;
292 if (stack_vars_num >= stack_vars_alloc)
294 if (stack_vars_alloc)
295 stack_vars_alloc = stack_vars_alloc * 3 / 2;
296 else
297 stack_vars_alloc = 32;
298 stack_vars
299 = XRESIZEVEC (struct stack_var, stack_vars, stack_vars_alloc);
301 if (!decl_to_stack_part)
302 decl_to_stack_part = new hash_map<tree, size_t>;
304 v = &stack_vars[stack_vars_num];
305 decl_to_stack_part->put (decl, stack_vars_num);
307 v->decl = decl;
308 v->size = tree_to_uhwi (DECL_SIZE_UNIT (SSAVAR (decl)));
309 /* Ensure that all variables have size, so that &a != &b for any two
310 variables that are simultaneously live. */
311 if (v->size == 0)
312 v->size = 1;
313 v->alignb = align_local_variable (SSAVAR (decl));
314 /* An alignment of zero can mightily confuse us later. */
315 gcc_assert (v->alignb != 0);
317 /* All variables are initially in their own partition. */
318 v->representative = stack_vars_num;
319 v->next = EOC;
321 /* All variables initially conflict with no other. */
322 v->conflicts = NULL;
324 /* Ensure that this decl doesn't get put onto the list twice. */
325 set_rtl (decl, pc_rtx);
327 stack_vars_num++;
330 /* Make the decls associated with luid's X and Y conflict. */
332 static void
333 add_stack_var_conflict (size_t x, size_t y)
335 struct stack_var *a = &stack_vars[x];
336 struct stack_var *b = &stack_vars[y];
337 if (!a->conflicts)
338 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
339 if (!b->conflicts)
340 b->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
341 bitmap_set_bit (a->conflicts, y);
342 bitmap_set_bit (b->conflicts, x);
345 /* Check whether the decls associated with luid's X and Y conflict. */
347 static bool
348 stack_var_conflict_p (size_t x, size_t y)
350 struct stack_var *a = &stack_vars[x];
351 struct stack_var *b = &stack_vars[y];
352 if (x == y)
353 return false;
354 /* Partitions containing an SSA name result from gimple registers
355 with things like unsupported modes. They are top-level and
356 hence conflict with everything else. */
357 if (TREE_CODE (a->decl) == SSA_NAME || TREE_CODE (b->decl) == SSA_NAME)
358 return true;
360 if (!a->conflicts || !b->conflicts)
361 return false;
362 return bitmap_bit_p (a->conflicts, y);
365 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
366 enter its partition number into bitmap DATA. */
368 static bool
369 visit_op (gimple, tree op, tree, void *data)
371 bitmap active = (bitmap)data;
372 op = get_base_address (op);
373 if (op
374 && DECL_P (op)
375 && DECL_RTL_IF_SET (op) == pc_rtx)
377 size_t *v = decl_to_stack_part->get (op);
378 if (v)
379 bitmap_set_bit (active, *v);
381 return false;
384 /* Callback for walk_stmt_ops. If OP is a decl touched by add_stack_var
385 record conflicts between it and all currently active other partitions
386 from bitmap DATA. */
388 static bool
389 visit_conflict (gimple, tree op, tree, void *data)
391 bitmap active = (bitmap)data;
392 op = get_base_address (op);
393 if (op
394 && DECL_P (op)
395 && DECL_RTL_IF_SET (op) == pc_rtx)
397 size_t *v = decl_to_stack_part->get (op);
398 if (v && bitmap_set_bit (active, *v))
400 size_t num = *v;
401 bitmap_iterator bi;
402 unsigned i;
403 gcc_assert (num < stack_vars_num);
404 EXECUTE_IF_SET_IN_BITMAP (active, 0, i, bi)
405 add_stack_var_conflict (num, i);
408 return false;
411 /* Helper routine for add_scope_conflicts, calculating the active partitions
412 at the end of BB, leaving the result in WORK. We're called to generate
413 conflicts when FOR_CONFLICT is true, otherwise we're just tracking
414 liveness. */
416 static void
417 add_scope_conflicts_1 (basic_block bb, bitmap work, bool for_conflict)
419 edge e;
420 edge_iterator ei;
421 gimple_stmt_iterator gsi;
422 walk_stmt_load_store_addr_fn visit;
424 bitmap_clear (work);
425 FOR_EACH_EDGE (e, ei, bb->preds)
426 bitmap_ior_into (work, (bitmap)e->src->aux);
428 visit = visit_op;
430 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
432 gimple stmt = gsi_stmt (gsi);
433 walk_stmt_load_store_addr_ops (stmt, work, NULL, NULL, visit);
435 for (gsi = gsi_after_labels (bb); !gsi_end_p (gsi); gsi_next (&gsi))
437 gimple stmt = gsi_stmt (gsi);
439 if (gimple_clobber_p (stmt))
441 tree lhs = gimple_assign_lhs (stmt);
442 size_t *v;
443 /* Nested function lowering might introduce LHSs
444 that are COMPONENT_REFs. */
445 if (TREE_CODE (lhs) != VAR_DECL)
446 continue;
447 if (DECL_RTL_IF_SET (lhs) == pc_rtx
448 && (v = decl_to_stack_part->get (lhs)))
449 bitmap_clear_bit (work, *v);
451 else if (!is_gimple_debug (stmt))
453 if (for_conflict
454 && visit == visit_op)
456 /* If this is the first real instruction in this BB we need
457 to add conflicts for everything live at this point now.
458 Unlike classical liveness for named objects we can't
459 rely on seeing a def/use of the names we're interested in.
460 There might merely be indirect loads/stores. We'd not add any
461 conflicts for such partitions. */
462 bitmap_iterator bi;
463 unsigned i;
464 EXECUTE_IF_SET_IN_BITMAP (work, 0, i, bi)
466 struct stack_var *a = &stack_vars[i];
467 if (!a->conflicts)
468 a->conflicts = BITMAP_ALLOC (&stack_var_bitmap_obstack);
469 bitmap_ior_into (a->conflicts, work);
471 visit = visit_conflict;
473 walk_stmt_load_store_addr_ops (stmt, work, visit, visit, visit);
478 /* Generate stack partition conflicts between all partitions that are
479 simultaneously live. */
481 static void
482 add_scope_conflicts (void)
484 basic_block bb;
485 bool changed;
486 bitmap work = BITMAP_ALLOC (NULL);
487 int *rpo;
488 int n_bbs;
490 /* We approximate the live range of a stack variable by taking the first
491 mention of its name as starting point(s), and by the end-of-scope
492 death clobber added by gimplify as ending point(s) of the range.
493 This overapproximates in the case we for instance moved an address-taken
494 operation upward, without also moving a dereference to it upwards.
495 But it's conservatively correct as a variable never can hold values
496 before its name is mentioned at least once.
498 We then do a mostly classical bitmap liveness algorithm. */
500 FOR_ALL_BB_FN (bb, cfun)
501 bb->aux = BITMAP_ALLOC (&stack_var_bitmap_obstack);
503 rpo = XNEWVEC (int, last_basic_block_for_fn (cfun));
504 n_bbs = pre_and_rev_post_order_compute (NULL, rpo, false);
506 changed = true;
507 while (changed)
509 int i;
510 changed = false;
511 for (i = 0; i < n_bbs; i++)
513 bitmap active;
514 bb = BASIC_BLOCK_FOR_FN (cfun, rpo[i]);
515 active = (bitmap)bb->aux;
516 add_scope_conflicts_1 (bb, work, false);
517 if (bitmap_ior_into (active, work))
518 changed = true;
522 FOR_EACH_BB_FN (bb, cfun)
523 add_scope_conflicts_1 (bb, work, true);
525 free (rpo);
526 BITMAP_FREE (work);
527 FOR_ALL_BB_FN (bb, cfun)
528 BITMAP_FREE (bb->aux);
531 /* A subroutine of partition_stack_vars. A comparison function for qsort,
532 sorting an array of indices by the properties of the object. */
534 static int
535 stack_var_cmp (const void *a, const void *b)
537 size_t ia = *(const size_t *)a;
538 size_t ib = *(const size_t *)b;
539 unsigned int aligna = stack_vars[ia].alignb;
540 unsigned int alignb = stack_vars[ib].alignb;
541 HOST_WIDE_INT sizea = stack_vars[ia].size;
542 HOST_WIDE_INT sizeb = stack_vars[ib].size;
543 tree decla = stack_vars[ia].decl;
544 tree declb = stack_vars[ib].decl;
545 bool largea, largeb;
546 unsigned int uida, uidb;
548 /* Primary compare on "large" alignment. Large comes first. */
549 largea = (aligna * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
550 largeb = (alignb * BITS_PER_UNIT > MAX_SUPPORTED_STACK_ALIGNMENT);
551 if (largea != largeb)
552 return (int)largeb - (int)largea;
554 /* Secondary compare on size, decreasing */
555 if (sizea > sizeb)
556 return -1;
557 if (sizea < sizeb)
558 return 1;
560 /* Tertiary compare on true alignment, decreasing. */
561 if (aligna < alignb)
562 return -1;
563 if (aligna > alignb)
564 return 1;
566 /* Final compare on ID for sort stability, increasing.
567 Two SSA names are compared by their version, SSA names come before
568 non-SSA names, and two normal decls are compared by their DECL_UID. */
569 if (TREE_CODE (decla) == SSA_NAME)
571 if (TREE_CODE (declb) == SSA_NAME)
572 uida = SSA_NAME_VERSION (decla), uidb = SSA_NAME_VERSION (declb);
573 else
574 return -1;
576 else if (TREE_CODE (declb) == SSA_NAME)
577 return 1;
578 else
579 uida = DECL_UID (decla), uidb = DECL_UID (declb);
580 if (uida < uidb)
581 return 1;
582 if (uida > uidb)
583 return -1;
584 return 0;
587 struct part_traits : default_hashmap_traits
589 template<typename T>
590 static bool
591 is_deleted (T &e)
592 { return e.m_value == reinterpret_cast<void *> (1); }
594 template<typename T> static bool is_empty (T &e) { return e.m_value == NULL; }
595 template<typename T>
596 static void
597 mark_deleted (T &e)
598 { e.m_value = reinterpret_cast<T> (1); }
600 template<typename T>
601 static void
602 mark_empty (T &e)
603 { e.m_value = NULL; }
606 typedef hash_map<size_t, bitmap, part_traits> part_hashmap;
608 /* If the points-to solution *PI points to variables that are in a partition
609 together with other variables add all partition members to the pointed-to
610 variables bitmap. */
612 static void
613 add_partitioned_vars_to_ptset (struct pt_solution *pt,
614 part_hashmap *decls_to_partitions,
615 hash_set<bitmap> *visited, bitmap temp)
617 bitmap_iterator bi;
618 unsigned i;
619 bitmap *part;
621 if (pt->anything
622 || pt->vars == NULL
623 /* The pointed-to vars bitmap is shared, it is enough to
624 visit it once. */
625 || visited->add (pt->vars))
626 return;
628 bitmap_clear (temp);
630 /* By using a temporary bitmap to store all members of the partitions
631 we have to add we make sure to visit each of the partitions only
632 once. */
633 EXECUTE_IF_SET_IN_BITMAP (pt->vars, 0, i, bi)
634 if ((!temp
635 || !bitmap_bit_p (temp, i))
636 && (part = decls_to_partitions->get (i)))
637 bitmap_ior_into (temp, *part);
638 if (!bitmap_empty_p (temp))
639 bitmap_ior_into (pt->vars, temp);
642 /* Update points-to sets based on partition info, so we can use them on RTL.
643 The bitmaps representing stack partitions will be saved until expand,
644 where partitioned decls used as bases in memory expressions will be
645 rewritten. */
647 static void
648 update_alias_info_with_stack_vars (void)
650 part_hashmap *decls_to_partitions = NULL;
651 size_t i, j;
652 tree var = NULL_TREE;
654 for (i = 0; i < stack_vars_num; i++)
656 bitmap part = NULL;
657 tree name;
658 struct ptr_info_def *pi;
660 /* Not interested in partitions with single variable. */
661 if (stack_vars[i].representative != i
662 || stack_vars[i].next == EOC)
663 continue;
665 if (!decls_to_partitions)
667 decls_to_partitions = new part_hashmap;
668 cfun->gimple_df->decls_to_pointers = new hash_map<tree, tree>;
671 /* Create an SSA_NAME that points to the partition for use
672 as base during alias-oracle queries on RTL for bases that
673 have been partitioned. */
674 if (var == NULL_TREE)
675 var = create_tmp_var (ptr_type_node, NULL);
676 name = make_ssa_name (var, NULL);
678 /* Create bitmaps representing partitions. They will be used for
679 points-to sets later, so use GGC alloc. */
680 part = BITMAP_GGC_ALLOC ();
681 for (j = i; j != EOC; j = stack_vars[j].next)
683 tree decl = stack_vars[j].decl;
684 unsigned int uid = DECL_PT_UID (decl);
685 bitmap_set_bit (part, uid);
686 decls_to_partitions->put (uid, part);
687 cfun->gimple_df->decls_to_pointers->put (decl, name);
688 if (TREE_ADDRESSABLE (decl))
689 TREE_ADDRESSABLE (name) = 1;
692 /* Make the SSA name point to all partition members. */
693 pi = get_ptr_info (name);
694 pt_solution_set (&pi->pt, part, false);
697 /* Make all points-to sets that contain one member of a partition
698 contain all members of the partition. */
699 if (decls_to_partitions)
701 unsigned i;
702 hash_set<bitmap> visited;
703 bitmap temp = BITMAP_ALLOC (&stack_var_bitmap_obstack);
705 for (i = 1; i < num_ssa_names; i++)
707 tree name = ssa_name (i);
708 struct ptr_info_def *pi;
710 if (name
711 && POINTER_TYPE_P (TREE_TYPE (name))
712 && ((pi = SSA_NAME_PTR_INFO (name)) != NULL))
713 add_partitioned_vars_to_ptset (&pi->pt, decls_to_partitions,
714 &visited, temp);
717 add_partitioned_vars_to_ptset (&cfun->gimple_df->escaped,
718 decls_to_partitions, &visited, temp);
720 delete decls_to_partitions;
721 BITMAP_FREE (temp);
725 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
726 partitioning algorithm. Partitions A and B are known to be non-conflicting.
727 Merge them into a single partition A. */
729 static void
730 union_stack_vars (size_t a, size_t b)
732 struct stack_var *vb = &stack_vars[b];
733 bitmap_iterator bi;
734 unsigned u;
736 gcc_assert (stack_vars[b].next == EOC);
737 /* Add B to A's partition. */
738 stack_vars[b].next = stack_vars[a].next;
739 stack_vars[b].representative = a;
740 stack_vars[a].next = b;
742 /* Update the required alignment of partition A to account for B. */
743 if (stack_vars[a].alignb < stack_vars[b].alignb)
744 stack_vars[a].alignb = stack_vars[b].alignb;
746 /* Update the interference graph and merge the conflicts. */
747 if (vb->conflicts)
749 EXECUTE_IF_SET_IN_BITMAP (vb->conflicts, 0, u, bi)
750 add_stack_var_conflict (a, stack_vars[u].representative);
751 BITMAP_FREE (vb->conflicts);
755 /* A subroutine of expand_used_vars. Binpack the variables into
756 partitions constrained by the interference graph. The overall
757 algorithm used is as follows:
759 Sort the objects by size in descending order.
760 For each object A {
761 S = size(A)
762 O = 0
763 loop {
764 Look for the largest non-conflicting object B with size <= S.
765 UNION (A, B)
770 static void
771 partition_stack_vars (void)
773 size_t si, sj, n = stack_vars_num;
775 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
776 for (si = 0; si < n; ++si)
777 stack_vars_sorted[si] = si;
779 if (n == 1)
780 return;
782 qsort (stack_vars_sorted, n, sizeof (size_t), stack_var_cmp);
784 for (si = 0; si < n; ++si)
786 size_t i = stack_vars_sorted[si];
787 unsigned int ialign = stack_vars[i].alignb;
788 HOST_WIDE_INT isize = stack_vars[i].size;
790 /* Ignore objects that aren't partition representatives. If we
791 see a var that is not a partition representative, it must
792 have been merged earlier. */
793 if (stack_vars[i].representative != i)
794 continue;
796 for (sj = si + 1; sj < n; ++sj)
798 size_t j = stack_vars_sorted[sj];
799 unsigned int jalign = stack_vars[j].alignb;
800 HOST_WIDE_INT jsize = stack_vars[j].size;
802 /* Ignore objects that aren't partition representatives. */
803 if (stack_vars[j].representative != j)
804 continue;
806 /* Do not mix objects of "small" (supported) alignment
807 and "large" (unsupported) alignment. */
808 if ((ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
809 != (jalign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT))
810 break;
812 /* For Address Sanitizer do not mix objects with different
813 sizes, as the shorter vars wouldn't be adequately protected.
814 Don't do that for "large" (unsupported) alignment objects,
815 those aren't protected anyway. */
816 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK && isize != jsize
817 && ialign * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
818 break;
820 /* Ignore conflicting objects. */
821 if (stack_var_conflict_p (i, j))
822 continue;
824 /* UNION the objects, placing J at OFFSET. */
825 union_stack_vars (i, j);
829 update_alias_info_with_stack_vars ();
832 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
834 static void
835 dump_stack_var_partition (void)
837 size_t si, i, j, n = stack_vars_num;
839 for (si = 0; si < n; ++si)
841 i = stack_vars_sorted[si];
843 /* Skip variables that aren't partition representatives, for now. */
844 if (stack_vars[i].representative != i)
845 continue;
847 fprintf (dump_file, "Partition %lu: size " HOST_WIDE_INT_PRINT_DEC
848 " align %u\n", (unsigned long) i, stack_vars[i].size,
849 stack_vars[i].alignb);
851 for (j = i; j != EOC; j = stack_vars[j].next)
853 fputc ('\t', dump_file);
854 print_generic_expr (dump_file, stack_vars[j].decl, dump_flags);
856 fputc ('\n', dump_file);
860 /* Assign rtl to DECL at BASE + OFFSET. */
862 static void
863 expand_one_stack_var_at (tree decl, rtx base, unsigned base_align,
864 HOST_WIDE_INT offset)
866 unsigned align;
867 rtx x;
869 /* If this fails, we've overflowed the stack frame. Error nicely? */
870 gcc_assert (offset == trunc_int_for_mode (offset, Pmode));
872 x = plus_constant (Pmode, base, offset);
873 x = gen_rtx_MEM (DECL_MODE (SSAVAR (decl)), x);
875 if (TREE_CODE (decl) != SSA_NAME)
877 /* Set alignment we actually gave this decl if it isn't an SSA name.
878 If it is we generate stack slots only accidentally so it isn't as
879 important, we'll simply use the alignment that is already set. */
880 if (base == virtual_stack_vars_rtx)
881 offset -= frame_phase;
882 align = offset & -offset;
883 align *= BITS_PER_UNIT;
884 if (align == 0 || align > base_align)
885 align = base_align;
887 /* One would think that we could assert that we're not decreasing
888 alignment here, but (at least) the i386 port does exactly this
889 via the MINIMUM_ALIGNMENT hook. */
891 DECL_ALIGN (decl) = align;
892 DECL_USER_ALIGN (decl) = 0;
895 set_mem_attributes (x, SSAVAR (decl), true);
896 set_rtl (decl, x);
899 struct stack_vars_data
901 /* Vector of offset pairs, always end of some padding followed
902 by start of the padding that needs Address Sanitizer protection.
903 The vector is in reversed, highest offset pairs come first. */
904 vec<HOST_WIDE_INT> asan_vec;
906 /* Vector of partition representative decls in between the paddings. */
907 vec<tree> asan_decl_vec;
909 /* Base pseudo register for Address Sanitizer protected automatic vars. */
910 rtx asan_base;
912 /* Alignment needed for the Address Sanitizer protected automatic vars. */
913 unsigned int asan_alignb;
916 /* A subroutine of expand_used_vars. Give each partition representative
917 a unique location within the stack frame. Update each partition member
918 with that location. */
920 static void
921 expand_stack_vars (bool (*pred) (size_t), struct stack_vars_data *data)
923 size_t si, i, j, n = stack_vars_num;
924 HOST_WIDE_INT large_size = 0, large_alloc = 0;
925 rtx large_base = NULL;
926 unsigned large_align = 0;
927 tree decl;
929 /* Determine if there are any variables requiring "large" alignment.
930 Since these are dynamically allocated, we only process these if
931 no predicate involved. */
932 large_align = stack_vars[stack_vars_sorted[0]].alignb * BITS_PER_UNIT;
933 if (pred == NULL && large_align > MAX_SUPPORTED_STACK_ALIGNMENT)
935 /* Find the total size of these variables. */
936 for (si = 0; si < n; ++si)
938 unsigned alignb;
940 i = stack_vars_sorted[si];
941 alignb = stack_vars[i].alignb;
943 /* Stop when we get to the first decl with "small" alignment. */
944 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
945 break;
947 /* Skip variables that aren't partition representatives. */
948 if (stack_vars[i].representative != i)
949 continue;
951 /* Skip variables that have already had rtl assigned. See also
952 add_stack_var where we perpetrate this pc_rtx hack. */
953 decl = stack_vars[i].decl;
954 if ((TREE_CODE (decl) == SSA_NAME
955 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)]
956 : DECL_RTL (decl)) != pc_rtx)
957 continue;
959 large_size += alignb - 1;
960 large_size &= -(HOST_WIDE_INT)alignb;
961 large_size += stack_vars[i].size;
964 /* If there were any, allocate space. */
965 if (large_size > 0)
966 large_base = allocate_dynamic_stack_space (GEN_INT (large_size), 0,
967 large_align, true);
970 for (si = 0; si < n; ++si)
972 rtx base;
973 unsigned base_align, alignb;
974 HOST_WIDE_INT offset;
976 i = stack_vars_sorted[si];
978 /* Skip variables that aren't partition representatives, for now. */
979 if (stack_vars[i].representative != i)
980 continue;
982 /* Skip variables that have already had rtl assigned. See also
983 add_stack_var where we perpetrate this pc_rtx hack. */
984 decl = stack_vars[i].decl;
985 if ((TREE_CODE (decl) == SSA_NAME
986 ? SA.partition_to_pseudo[var_to_partition (SA.map, decl)]
987 : DECL_RTL (decl)) != pc_rtx)
988 continue;
990 /* Check the predicate to see whether this variable should be
991 allocated in this pass. */
992 if (pred && !pred (i))
993 continue;
995 alignb = stack_vars[i].alignb;
996 if (alignb * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT)
998 base = virtual_stack_vars_rtx;
999 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK && pred)
1001 HOST_WIDE_INT prev_offset = frame_offset;
1002 tree repr_decl = NULL_TREE;
1004 offset
1005 = alloc_stack_frame_space (stack_vars[i].size
1006 + ASAN_RED_ZONE_SIZE,
1007 MAX (alignb, ASAN_RED_ZONE_SIZE));
1008 data->asan_vec.safe_push (prev_offset);
1009 data->asan_vec.safe_push (offset + stack_vars[i].size);
1010 /* Find best representative of the partition.
1011 Prefer those with DECL_NAME, even better
1012 satisfying asan_protect_stack_decl predicate. */
1013 for (j = i; j != EOC; j = stack_vars[j].next)
1014 if (asan_protect_stack_decl (stack_vars[j].decl)
1015 && DECL_NAME (stack_vars[j].decl))
1017 repr_decl = stack_vars[j].decl;
1018 break;
1020 else if (repr_decl == NULL_TREE
1021 && DECL_P (stack_vars[j].decl)
1022 && DECL_NAME (stack_vars[j].decl))
1023 repr_decl = stack_vars[j].decl;
1024 if (repr_decl == NULL_TREE)
1025 repr_decl = stack_vars[i].decl;
1026 data->asan_decl_vec.safe_push (repr_decl);
1027 data->asan_alignb = MAX (data->asan_alignb, alignb);
1028 if (data->asan_base == NULL)
1029 data->asan_base = gen_reg_rtx (Pmode);
1030 base = data->asan_base;
1032 if (!STRICT_ALIGNMENT)
1033 base_align = crtl->max_used_stack_slot_alignment;
1034 else
1035 base_align = MAX (crtl->max_used_stack_slot_alignment,
1036 GET_MODE_ALIGNMENT (SImode)
1037 << ASAN_SHADOW_SHIFT);
1039 else
1041 offset = alloc_stack_frame_space (stack_vars[i].size, alignb);
1042 base_align = crtl->max_used_stack_slot_alignment;
1045 else
1047 /* Large alignment is only processed in the last pass. */
1048 if (pred)
1049 continue;
1050 gcc_assert (large_base != NULL);
1052 large_alloc += alignb - 1;
1053 large_alloc &= -(HOST_WIDE_INT)alignb;
1054 offset = large_alloc;
1055 large_alloc += stack_vars[i].size;
1057 base = large_base;
1058 base_align = large_align;
1061 /* Create rtl for each variable based on their location within the
1062 partition. */
1063 for (j = i; j != EOC; j = stack_vars[j].next)
1065 expand_one_stack_var_at (stack_vars[j].decl,
1066 base, base_align,
1067 offset);
1071 gcc_assert (large_alloc == large_size);
1074 /* Take into account all sizes of partitions and reset DECL_RTLs. */
1075 static HOST_WIDE_INT
1076 account_stack_vars (void)
1078 size_t si, j, i, n = stack_vars_num;
1079 HOST_WIDE_INT size = 0;
1081 for (si = 0; si < n; ++si)
1083 i = stack_vars_sorted[si];
1085 /* Skip variables that aren't partition representatives, for now. */
1086 if (stack_vars[i].representative != i)
1087 continue;
1089 size += stack_vars[i].size;
1090 for (j = i; j != EOC; j = stack_vars[j].next)
1091 set_rtl (stack_vars[j].decl, NULL);
1093 return size;
1096 /* A subroutine of expand_one_var. Called to immediately assign rtl
1097 to a variable to be allocated in the stack frame. */
1099 static void
1100 expand_one_stack_var (tree var)
1102 HOST_WIDE_INT size, offset;
1103 unsigned byte_align;
1105 size = tree_to_uhwi (DECL_SIZE_UNIT (SSAVAR (var)));
1106 byte_align = align_local_variable (SSAVAR (var));
1108 /* We handle highly aligned variables in expand_stack_vars. */
1109 gcc_assert (byte_align * BITS_PER_UNIT <= MAX_SUPPORTED_STACK_ALIGNMENT);
1111 offset = alloc_stack_frame_space (size, byte_align);
1113 expand_one_stack_var_at (var, virtual_stack_vars_rtx,
1114 crtl->max_used_stack_slot_alignment, offset);
1117 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1118 that will reside in a hard register. */
1120 static void
1121 expand_one_hard_reg_var (tree var)
1123 rest_of_decl_compilation (var, 0, 0);
1126 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
1127 that will reside in a pseudo register. */
1129 static void
1130 expand_one_register_var (tree var)
1132 tree decl = SSAVAR (var);
1133 tree type = TREE_TYPE (decl);
1134 enum machine_mode reg_mode = promote_decl_mode (decl, NULL);
1135 rtx x = gen_reg_rtx (reg_mode);
1137 set_rtl (var, x);
1139 /* Note if the object is a user variable. */
1140 if (!DECL_ARTIFICIAL (decl))
1141 mark_user_reg (x);
1143 if (POINTER_TYPE_P (type))
1144 mark_reg_pointer (x, get_pointer_alignment (var));
1147 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
1148 has some associated error, e.g. its type is error-mark. We just need
1149 to pick something that won't crash the rest of the compiler. */
1151 static void
1152 expand_one_error_var (tree var)
1154 enum machine_mode mode = DECL_MODE (var);
1155 rtx x;
1157 if (mode == BLKmode)
1158 x = gen_rtx_MEM (BLKmode, const0_rtx);
1159 else if (mode == VOIDmode)
1160 x = const0_rtx;
1161 else
1162 x = gen_reg_rtx (mode);
1164 SET_DECL_RTL (var, x);
1167 /* A subroutine of expand_one_var. VAR is a variable that will be
1168 allocated to the local stack frame. Return true if we wish to
1169 add VAR to STACK_VARS so that it will be coalesced with other
1170 variables. Return false to allocate VAR immediately.
1172 This function is used to reduce the number of variables considered
1173 for coalescing, which reduces the size of the quadratic problem. */
1175 static bool
1176 defer_stack_allocation (tree var, bool toplevel)
1178 /* Whether the variable is small enough for immediate allocation not to be
1179 a problem with regard to the frame size. */
1180 bool smallish
1181 = ((HOST_WIDE_INT) tree_to_uhwi (DECL_SIZE_UNIT (var))
1182 < PARAM_VALUE (PARAM_MIN_SIZE_FOR_STACK_SHARING));
1184 /* If stack protection is enabled, *all* stack variables must be deferred,
1185 so that we can re-order the strings to the top of the frame.
1186 Similarly for Address Sanitizer. */
1187 if (flag_stack_protect || ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK))
1188 return true;
1190 /* We handle "large" alignment via dynamic allocation. We want to handle
1191 this extra complication in only one place, so defer them. */
1192 if (DECL_ALIGN (var) > MAX_SUPPORTED_STACK_ALIGNMENT)
1193 return true;
1195 /* When optimization is enabled, DECL_IGNORED_P variables originally scoped
1196 might be detached from their block and appear at toplevel when we reach
1197 here. We want to coalesce them with variables from other blocks when
1198 the immediate contribution to the frame size would be noticeable. */
1199 if (toplevel && optimize > 0 && DECL_IGNORED_P (var) && !smallish)
1200 return true;
1202 /* Variables declared in the outermost scope automatically conflict
1203 with every other variable. The only reason to want to defer them
1204 at all is that, after sorting, we can more efficiently pack
1205 small variables in the stack frame. Continue to defer at -O2. */
1206 if (toplevel && optimize < 2)
1207 return false;
1209 /* Without optimization, *most* variables are allocated from the
1210 stack, which makes the quadratic problem large exactly when we
1211 want compilation to proceed as quickly as possible. On the
1212 other hand, we don't want the function's stack frame size to
1213 get completely out of hand. So we avoid adding scalars and
1214 "small" aggregates to the list at all. */
1215 if (optimize == 0 && smallish)
1216 return false;
1218 return true;
1221 /* A subroutine of expand_used_vars. Expand one variable according to
1222 its flavor. Variables to be placed on the stack are not actually
1223 expanded yet, merely recorded.
1224 When REALLY_EXPAND is false, only add stack values to be allocated.
1225 Return stack usage this variable is supposed to take.
1228 static HOST_WIDE_INT
1229 expand_one_var (tree var, bool toplevel, bool really_expand)
1231 unsigned int align = BITS_PER_UNIT;
1232 tree origvar = var;
1234 var = SSAVAR (var);
1236 if (TREE_TYPE (var) != error_mark_node && TREE_CODE (var) == VAR_DECL)
1238 /* Because we don't know if VAR will be in register or on stack,
1239 we conservatively assume it will be on stack even if VAR is
1240 eventually put into register after RA pass. For non-automatic
1241 variables, which won't be on stack, we collect alignment of
1242 type and ignore user specified alignment. Similarly for
1243 SSA_NAMEs for which use_register_for_decl returns true. */
1244 if (TREE_STATIC (var)
1245 || DECL_EXTERNAL (var)
1246 || (TREE_CODE (origvar) == SSA_NAME && use_register_for_decl (var)))
1247 align = MINIMUM_ALIGNMENT (TREE_TYPE (var),
1248 TYPE_MODE (TREE_TYPE (var)),
1249 TYPE_ALIGN (TREE_TYPE (var)));
1250 else if (DECL_HAS_VALUE_EXPR_P (var)
1251 || (DECL_RTL_SET_P (var) && MEM_P (DECL_RTL (var))))
1252 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1253 or variables which were assigned a stack slot already by
1254 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1255 changed from the offset chosen to it. */
1256 align = crtl->stack_alignment_estimated;
1257 else
1258 align = MINIMUM_ALIGNMENT (var, DECL_MODE (var), DECL_ALIGN (var));
1260 /* If the variable alignment is very large we'll dynamicaly allocate
1261 it, which means that in-frame portion is just a pointer. */
1262 if (align > MAX_SUPPORTED_STACK_ALIGNMENT)
1263 align = POINTER_SIZE;
1266 if (SUPPORTS_STACK_ALIGNMENT
1267 && crtl->stack_alignment_estimated < align)
1269 /* stack_alignment_estimated shouldn't change after stack
1270 realign decision made */
1271 gcc_assert (!crtl->stack_realign_processed);
1272 crtl->stack_alignment_estimated = align;
1275 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1276 So here we only make sure stack_alignment_needed >= align. */
1277 if (crtl->stack_alignment_needed < align)
1278 crtl->stack_alignment_needed = align;
1279 if (crtl->max_used_stack_slot_alignment < align)
1280 crtl->max_used_stack_slot_alignment = align;
1282 if (TREE_CODE (origvar) == SSA_NAME)
1284 gcc_assert (TREE_CODE (var) != VAR_DECL
1285 || (!DECL_EXTERNAL (var)
1286 && !DECL_HAS_VALUE_EXPR_P (var)
1287 && !TREE_STATIC (var)
1288 && TREE_TYPE (var) != error_mark_node
1289 && !DECL_HARD_REGISTER (var)
1290 && really_expand));
1292 if (TREE_CODE (var) != VAR_DECL && TREE_CODE (origvar) != SSA_NAME)
1294 else if (DECL_EXTERNAL (var))
1296 else if (DECL_HAS_VALUE_EXPR_P (var))
1298 else if (TREE_STATIC (var))
1300 else if (TREE_CODE (origvar) != SSA_NAME && DECL_RTL_SET_P (var))
1302 else if (TREE_TYPE (var) == error_mark_node)
1304 if (really_expand)
1305 expand_one_error_var (var);
1307 else if (TREE_CODE (var) == VAR_DECL && DECL_HARD_REGISTER (var))
1309 if (really_expand)
1311 expand_one_hard_reg_var (var);
1312 if (!DECL_HARD_REGISTER (var))
1313 /* Invalid register specification. */
1314 expand_one_error_var (var);
1317 else if (use_register_for_decl (var))
1319 if (really_expand)
1320 expand_one_register_var (origvar);
1322 else if (! valid_constant_size_p (DECL_SIZE_UNIT (var)))
1324 /* Reject variables which cover more than half of the address-space. */
1325 if (really_expand)
1327 error ("size of variable %q+D is too large", var);
1328 expand_one_error_var (var);
1331 else if (defer_stack_allocation (var, toplevel))
1332 add_stack_var (origvar);
1333 else
1335 if (really_expand)
1336 expand_one_stack_var (origvar);
1337 return tree_to_uhwi (DECL_SIZE_UNIT (var));
1339 return 0;
1342 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1343 expanding variables. Those variables that can be put into registers
1344 are allocated pseudos; those that can't are put on the stack.
1346 TOPLEVEL is true if this is the outermost BLOCK. */
1348 static void
1349 expand_used_vars_for_block (tree block, bool toplevel)
1351 tree t;
1353 /* Expand all variables at this level. */
1354 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1355 if (TREE_USED (t)
1356 && ((TREE_CODE (t) != VAR_DECL && TREE_CODE (t) != RESULT_DECL)
1357 || !DECL_NONSHAREABLE (t)))
1358 expand_one_var (t, toplevel, true);
1360 /* Expand all variables at containing levels. */
1361 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1362 expand_used_vars_for_block (t, false);
1365 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1366 and clear TREE_USED on all local variables. */
1368 static void
1369 clear_tree_used (tree block)
1371 tree t;
1373 for (t = BLOCK_VARS (block); t ; t = DECL_CHAIN (t))
1374 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1375 if ((TREE_CODE (t) != VAR_DECL && TREE_CODE (t) != RESULT_DECL)
1376 || !DECL_NONSHAREABLE (t))
1377 TREE_USED (t) = 0;
1379 for (t = BLOCK_SUBBLOCKS (block); t ; t = BLOCK_CHAIN (t))
1380 clear_tree_used (t);
/* Values flag_stack_protect is compared against in this file.  */
enum {
  /* A guard is created when the function calls alloca or has
     protected decls.  */
  SPCT_FLAG_DEFAULT = 1,

  /* A guard is always created.  */
  SPCT_FLAG_ALL = 2,

  /* As SPCT_FLAG_DEFAULT, and additionally when the function has local
     arrays/addressable locals or calls that use a return slot.  */
  SPCT_FLAG_STRONG = 3
};
1389 /* Examine TYPE and determine a bit mask of the following features. */
1391 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1392 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1393 #define SPCT_HAS_ARRAY 4
1394 #define SPCT_HAS_AGGREGATE 8
1396 static unsigned int
1397 stack_protect_classify_type (tree type)
1399 unsigned int ret = 0;
1400 tree t;
1402 switch (TREE_CODE (type))
1404 case ARRAY_TYPE:
1405 t = TYPE_MAIN_VARIANT (TREE_TYPE (type));
1406 if (t == char_type_node
1407 || t == signed_char_type_node
1408 || t == unsigned_char_type_node)
1410 unsigned HOST_WIDE_INT max = PARAM_VALUE (PARAM_SSP_BUFFER_SIZE);
1411 unsigned HOST_WIDE_INT len;
1413 if (!TYPE_SIZE_UNIT (type)
1414 || !tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
1415 len = max;
1416 else
1417 len = tree_to_uhwi (TYPE_SIZE_UNIT (type));
1419 if (len < max)
1420 ret = SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_ARRAY;
1421 else
1422 ret = SPCT_HAS_LARGE_CHAR_ARRAY | SPCT_HAS_ARRAY;
1424 else
1425 ret = SPCT_HAS_ARRAY;
1426 break;
1428 case UNION_TYPE:
1429 case QUAL_UNION_TYPE:
1430 case RECORD_TYPE:
1431 ret = SPCT_HAS_AGGREGATE;
1432 for (t = TYPE_FIELDS (type); t ; t = TREE_CHAIN (t))
1433 if (TREE_CODE (t) == FIELD_DECL)
1434 ret |= stack_protect_classify_type (TREE_TYPE (t));
1435 break;
1437 default:
1438 break;
1441 return ret;
1444 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1445 part of the local stack frame. Remember if we ever return nonzero for
1446 any variable in this function. The return value is the phase number in
1447 which the variable should be allocated. */
1449 static int
1450 stack_protect_decl_phase (tree decl)
1452 unsigned int bits = stack_protect_classify_type (TREE_TYPE (decl));
1453 int ret = 0;
1455 if (bits & SPCT_HAS_SMALL_CHAR_ARRAY)
1456 has_short_buffer = true;
1458 if (flag_stack_protect == SPCT_FLAG_ALL
1459 || flag_stack_protect == SPCT_FLAG_STRONG)
1461 if ((bits & (SPCT_HAS_SMALL_CHAR_ARRAY | SPCT_HAS_LARGE_CHAR_ARRAY))
1462 && !(bits & SPCT_HAS_AGGREGATE))
1463 ret = 1;
1464 else if (bits & SPCT_HAS_ARRAY)
1465 ret = 2;
1467 else
1468 ret = (bits & SPCT_HAS_LARGE_CHAR_ARRAY) != 0;
1470 if (ret)
1471 has_protected_decls = true;
1473 return ret;
1476 /* Two helper routines that check for phase 1 and phase 2. These are used
1477 as callbacks for expand_stack_vars. */
1479 static bool
1480 stack_protect_decl_phase_1 (size_t i)
1482 return stack_protect_decl_phase (stack_vars[i].decl) == 1;
1485 static bool
1486 stack_protect_decl_phase_2 (size_t i)
1488 return stack_protect_decl_phase (stack_vars[i].decl) == 2;
1491 /* And helper function that checks for asan phase (with stack protector
1492 it is phase 3). This is used as callback for expand_stack_vars.
1493 Returns true if any of the vars in the partition need to be protected. */
1495 static bool
1496 asan_decl_phase_3 (size_t i)
1498 while (i != EOC)
1500 if (asan_protect_stack_decl (stack_vars[i].decl))
1501 return true;
1502 i = stack_vars[i].next;
1504 return false;
1507 /* Ensure that variables in different stack protection phases conflict
1508 so that they are not merged and share the same stack slot. */
1510 static void
1511 add_stack_protection_conflicts (void)
1513 size_t i, j, n = stack_vars_num;
1514 unsigned char *phase;
1516 phase = XNEWVEC (unsigned char, n);
1517 for (i = 0; i < n; ++i)
1518 phase[i] = stack_protect_decl_phase (stack_vars[i].decl);
1520 for (i = 0; i < n; ++i)
1522 unsigned char ph_i = phase[i];
1523 for (j = i + 1; j < n; ++j)
1524 if (ph_i != phase[j])
1525 add_stack_var_conflict (i, j);
1528 XDELETEVEC (phase);
1531 /* Create a decl for the guard at the top of the stack frame. */
1533 static void
1534 create_stack_guard (void)
1536 tree guard = build_decl (DECL_SOURCE_LOCATION (current_function_decl),
1537 VAR_DECL, NULL, ptr_type_node);
1538 TREE_THIS_VOLATILE (guard) = 1;
1539 TREE_USED (guard) = 1;
1540 expand_one_stack_var (guard);
1541 crtl->stack_protect_guard = guard;
1544 /* Prepare for expanding variables. */
1545 static void
1546 init_vars_expansion (void)
1548 /* Conflict bitmaps, and a few related temporary bitmaps, go here. */
1549 bitmap_obstack_initialize (&stack_var_bitmap_obstack);
1551 /* A map from decl to stack partition. */
1552 decl_to_stack_part = new hash_map<tree, size_t>;
1554 /* Initialize local stack smashing state. */
1555 has_protected_decls = false;
1556 has_short_buffer = false;
1559 /* Free up stack variable graph data. */
1560 static void
1561 fini_vars_expansion (void)
1563 bitmap_obstack_release (&stack_var_bitmap_obstack);
1564 if (stack_vars)
1565 XDELETEVEC (stack_vars);
1566 if (stack_vars_sorted)
1567 XDELETEVEC (stack_vars_sorted);
1568 stack_vars = NULL;
1569 stack_vars_sorted = NULL;
1570 stack_vars_alloc = stack_vars_num = 0;
1571 delete decl_to_stack_part;
1572 decl_to_stack_part = NULL;
1575 /* Make a fair guess for the size of the stack frame of the function
1576 in NODE. This doesn't have to be exact, the result is only used in
1577 the inline heuristics. So we don't want to run the full stack var
1578 packing algorithm (which is quadratic in the number of stack vars).
1579 Instead, we calculate the total size of all stack vars. This turns
1580 out to be a pretty fair estimate -- packing of stack vars doesn't
1581 happen very often. */
1583 HOST_WIDE_INT
1584 estimated_stack_frame_size (struct cgraph_node *node)
1586 HOST_WIDE_INT size = 0;
1587 size_t i;
1588 tree var;
1589 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
1591 push_cfun (fn);
1593 init_vars_expansion ();
1595 FOR_EACH_LOCAL_DECL (fn, i, var)
1596 if (auto_var_in_fn_p (var, fn->decl))
1597 size += expand_one_var (var, true, false);
1599 if (stack_vars_num > 0)
1601 /* Fake sorting the stack vars for account_stack_vars (). */
1602 stack_vars_sorted = XNEWVEC (size_t, stack_vars_num);
1603 for (i = 0; i < stack_vars_num; ++i)
1604 stack_vars_sorted[i] = i;
1605 size += account_stack_vars ();
1608 fini_vars_expansion ();
1609 pop_cfun ();
1610 return size;
1613 /* Helper routine to check if a record or union contains an array field. */
1615 static int
1616 record_or_union_type_has_array_p (const_tree tree_type)
1618 tree fields = TYPE_FIELDS (tree_type);
1619 tree f;
1621 for (f = fields; f; f = DECL_CHAIN (f))
1622 if (TREE_CODE (f) == FIELD_DECL)
1624 tree field_type = TREE_TYPE (f);
1625 if (RECORD_OR_UNION_TYPE_P (field_type)
1626 && record_or_union_type_has_array_p (field_type))
1627 return 1;
1628 if (TREE_CODE (field_type) == ARRAY_TYPE)
1629 return 1;
1631 return 0;
1634 /* Check if the current function has local referenced variables that
1635 have their addresses taken, contain an array, or are arrays. */
1637 static bool
1638 stack_protect_decl_p ()
1640 unsigned i;
1641 tree var;
1643 FOR_EACH_LOCAL_DECL (cfun, i, var)
1644 if (!is_global_var (var))
1646 tree var_type = TREE_TYPE (var);
1647 if (TREE_CODE (var) == VAR_DECL
1648 && (TREE_CODE (var_type) == ARRAY_TYPE
1649 || TREE_ADDRESSABLE (var)
1650 || (RECORD_OR_UNION_TYPE_P (var_type)
1651 && record_or_union_type_has_array_p (var_type))))
1652 return true;
1654 return false;
1657 /* Check if the current function has calls that use a return slot. */
1659 static bool
1660 stack_protect_return_slot_p ()
1662 basic_block bb;
1664 FOR_ALL_BB_FN (bb, cfun)
1665 for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1666 !gsi_end_p (gsi); gsi_next (&gsi))
1668 gimple stmt = gsi_stmt (gsi);
1669 /* This assumes that calls to internal-only functions never
1670 use a return slot. */
1671 if (is_gimple_call (stmt)
1672 && !gimple_call_internal_p (stmt)
1673 && aggregate_value_p (TREE_TYPE (gimple_call_fntype (stmt)),
1674 gimple_call_fndecl (stmt)))
1675 return true;
1677 return false;
1680 /* Expand all variables used in the function. */
1682 static rtx_insn *
1683 expand_used_vars (void)
1685 tree var, outer_block = DECL_INITIAL (current_function_decl);
1686 vec<tree> maybe_local_decls = vNULL;
1687 rtx_insn *var_end_seq = NULL;
1688 unsigned i;
1689 unsigned len;
1690 bool gen_stack_protect_signal = false;
1692 /* Compute the phase of the stack frame for this function. */
1694 int align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
1695 int off = STARTING_FRAME_OFFSET % align;
1696 frame_phase = off ? align - off : 0;
1699 /* Set TREE_USED on all variables in the local_decls. */
1700 FOR_EACH_LOCAL_DECL (cfun, i, var)
1701 TREE_USED (var) = 1;
1702 /* Clear TREE_USED on all variables associated with a block scope. */
1703 clear_tree_used (DECL_INITIAL (current_function_decl));
1705 init_vars_expansion ();
1707 hash_map<tree, tree> ssa_name_decls;
1708 for (i = 0; i < SA.map->num_partitions; i++)
1710 tree var = partition_to_var (SA.map, i);
1712 gcc_assert (!virtual_operand_p (var));
1714 /* Assign decls to each SSA name partition, share decls for partitions
1715 we could have coalesced (those with the same type). */
1716 if (SSA_NAME_VAR (var) == NULL_TREE)
1718 tree *slot = &ssa_name_decls.get_or_insert (TREE_TYPE (var));
1719 if (!*slot)
1720 *slot = create_tmp_reg (TREE_TYPE (var), NULL);
1721 replace_ssa_name_symbol (var, *slot);
1724 /* Always allocate space for partitions based on VAR_DECLs. But for
1725 those based on PARM_DECLs or RESULT_DECLs and which matter for the
1726 debug info, there is no need to do so if optimization is disabled
1727 because all the SSA_NAMEs based on these DECLs have been coalesced
1728 into a single partition, which is thus assigned the canonical RTL
1729 location of the DECLs. If in_lto_p, we can't rely on optimize,
1730 a function could be compiled with -O1 -flto first and only the
1731 link performed at -O0. */
1732 if (TREE_CODE (SSA_NAME_VAR (var)) == VAR_DECL)
1733 expand_one_var (var, true, true);
1734 else if (DECL_IGNORED_P (SSA_NAME_VAR (var)) || optimize || in_lto_p)
1736 /* This is a PARM_DECL or RESULT_DECL. For those partitions that
1737 contain the default def (representing the parm or result itself)
1738 we don't do anything here. But those which don't contain the
1739 default def (representing a temporary based on the parm/result)
1740 we need to allocate space just like for normal VAR_DECLs. */
1741 if (!bitmap_bit_p (SA.partition_has_default_def, i))
1743 expand_one_var (var, true, true);
1744 gcc_assert (SA.partition_to_pseudo[i]);
1749 if (flag_stack_protect == SPCT_FLAG_STRONG)
1750 gen_stack_protect_signal
1751 = stack_protect_decl_p () || stack_protect_return_slot_p ();
1753 /* At this point all variables on the local_decls with TREE_USED
1754 set are not associated with any block scope. Lay them out. */
1756 len = vec_safe_length (cfun->local_decls);
1757 FOR_EACH_LOCAL_DECL (cfun, i, var)
1759 bool expand_now = false;
1761 /* Expanded above already. */
1762 if (is_gimple_reg (var))
1764 TREE_USED (var) = 0;
1765 goto next;
1767 /* We didn't set a block for static or extern because it's hard
1768 to tell the difference between a global variable (re)declared
1769 in a local scope, and one that's really declared there to
1770 begin with. And it doesn't really matter much, since we're
1771 not giving them stack space. Expand them now. */
1772 else if (TREE_STATIC (var) || DECL_EXTERNAL (var))
1773 expand_now = true;
1775 /* Expand variables not associated with any block now. Those created by
1776 the optimizers could be live anywhere in the function. Those that
1777 could possibly have been scoped originally and detached from their
1778 block will have their allocation deferred so we coalesce them with
1779 others when optimization is enabled. */
1780 else if (TREE_USED (var))
1781 expand_now = true;
1783 /* Finally, mark all variables on the list as used. We'll use
1784 this in a moment when we expand those associated with scopes. */
1785 TREE_USED (var) = 1;
1787 if (expand_now)
1788 expand_one_var (var, true, true);
1790 next:
1791 if (DECL_ARTIFICIAL (var) && !DECL_IGNORED_P (var))
1793 rtx rtl = DECL_RTL_IF_SET (var);
1795 /* Keep artificial non-ignored vars in cfun->local_decls
1796 chain until instantiate_decls. */
1797 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
1798 add_local_decl (cfun, var);
1799 else if (rtl == NULL_RTX)
1800 /* If rtl isn't set yet, which can happen e.g. with
1801 -fstack-protector, retry before returning from this
1802 function. */
1803 maybe_local_decls.safe_push (var);
1807 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
1809 +-----------------+-----------------+
1810 | ...processed... | ...duplicates...|
1811 +-----------------+-----------------+
1813 +-- LEN points here.
1815 We just want the duplicates, as those are the artificial
1816 non-ignored vars that we want to keep until instantiate_decls.
1817 Move them down and truncate the array. */
1818 if (!vec_safe_is_empty (cfun->local_decls))
1819 cfun->local_decls->block_remove (0, len);
1821 /* At this point, all variables within the block tree with TREE_USED
1822 set are actually used by the optimized function. Lay them out. */
1823 expand_used_vars_for_block (outer_block, true);
1825 if (stack_vars_num > 0)
1827 add_scope_conflicts ();
1829 /* If stack protection is enabled, we don't share space between
1830 vulnerable data and non-vulnerable data. */
1831 if (flag_stack_protect)
1832 add_stack_protection_conflicts ();
1834 /* Now that we have collected all stack variables, and have computed a
1835 minimal interference graph, attempt to save some stack space. */
1836 partition_stack_vars ();
1837 if (dump_file)
1838 dump_stack_var_partition ();
1841 switch (flag_stack_protect)
1843 case SPCT_FLAG_ALL:
1844 create_stack_guard ();
1845 break;
1847 case SPCT_FLAG_STRONG:
1848 if (gen_stack_protect_signal
1849 || cfun->calls_alloca || has_protected_decls)
1850 create_stack_guard ();
1851 break;
1853 case SPCT_FLAG_DEFAULT:
1854 if (cfun->calls_alloca || has_protected_decls)
1855 create_stack_guard ();
1856 break;
1858 default:
1862 /* Assign rtl to each variable based on these partitions. */
1863 if (stack_vars_num > 0)
1865 struct stack_vars_data data;
1867 data.asan_vec = vNULL;
1868 data.asan_decl_vec = vNULL;
1869 data.asan_base = NULL_RTX;
1870 data.asan_alignb = 0;
1872 /* Reorder decls to be protected by iterating over the variables
1873 array multiple times, and allocating out of each phase in turn. */
1874 /* ??? We could probably integrate this into the qsort we did
1875 earlier, such that we naturally see these variables first,
1876 and thus naturally allocate things in the right order. */
1877 if (has_protected_decls)
1879 /* Phase 1 contains only character arrays. */
1880 expand_stack_vars (stack_protect_decl_phase_1, &data);
1882 /* Phase 2 contains other kinds of arrays. */
1883 if (flag_stack_protect == 2)
1884 expand_stack_vars (stack_protect_decl_phase_2, &data);
1887 if ((flag_sanitize & SANITIZE_ADDRESS) && ASAN_STACK)
1888 /* Phase 3, any partitions that need asan protection
1889 in addition to phase 1 and 2. */
1890 expand_stack_vars (asan_decl_phase_3, &data);
1892 if (!data.asan_vec.is_empty ())
1894 HOST_WIDE_INT prev_offset = frame_offset;
1895 HOST_WIDE_INT offset, sz, redzonesz;
1896 redzonesz = ASAN_RED_ZONE_SIZE;
1897 sz = data.asan_vec[0] - prev_offset;
1898 if (data.asan_alignb > ASAN_RED_ZONE_SIZE
1899 && data.asan_alignb <= 4096
1900 && sz + ASAN_RED_ZONE_SIZE >= (int) data.asan_alignb)
1901 redzonesz = ((sz + ASAN_RED_ZONE_SIZE + data.asan_alignb - 1)
1902 & ~(data.asan_alignb - HOST_WIDE_INT_1)) - sz;
1903 offset
1904 = alloc_stack_frame_space (redzonesz, ASAN_RED_ZONE_SIZE);
1905 data.asan_vec.safe_push (prev_offset);
1906 data.asan_vec.safe_push (offset);
1907 /* Leave space for alignment if STRICT_ALIGNMENT. */
1908 if (STRICT_ALIGNMENT)
1909 alloc_stack_frame_space ((GET_MODE_ALIGNMENT (SImode)
1910 << ASAN_SHADOW_SHIFT)
1911 / BITS_PER_UNIT, 1);
1913 var_end_seq
1914 = asan_emit_stack_protection (virtual_stack_vars_rtx,
1915 data.asan_base,
1916 data.asan_alignb,
1917 data.asan_vec.address (),
1918 data.asan_decl_vec.address (),
1919 data.asan_vec.length ());
1922 expand_stack_vars (NULL, &data);
1924 data.asan_vec.release ();
1925 data.asan_decl_vec.release ();
1928 fini_vars_expansion ();
1930 /* If there were any artificial non-ignored vars without rtl
1931 found earlier, see if deferred stack allocation hasn't assigned
1932 rtl to them. */
1933 FOR_EACH_VEC_ELT_REVERSE (maybe_local_decls, i, var)
1935 rtx rtl = DECL_RTL_IF_SET (var);
1937 /* Keep artificial non-ignored vars in cfun->local_decls
1938 chain until instantiate_decls. */
1939 if (rtl && (MEM_P (rtl) || GET_CODE (rtl) == CONCAT))
1940 add_local_decl (cfun, var);
1942 maybe_local_decls.release ();
1944 /* If the target requires that FRAME_OFFSET be aligned, do it. */
1945 if (STACK_ALIGNMENT_NEEDED)
1947 HOST_WIDE_INT align = PREFERRED_STACK_BOUNDARY / BITS_PER_UNIT;
1948 if (!FRAME_GROWS_DOWNWARD)
1949 frame_offset += align - 1;
1950 frame_offset &= -align;
1953 return var_end_seq;
1957 /* If we need to produce a detailed dump, print the tree representation
1958 for STMT to the dump file. SINCE is the last RTX after which the RTL
1959 generated for STMT should have been appended. */
1961 static void
1962 maybe_dump_rtl_for_gimple_stmt (gimple stmt, rtx_insn *since)
1964 if (dump_file && (dump_flags & TDF_DETAILS))
1966 fprintf (dump_file, "\n;; ");
1967 print_gimple_stmt (dump_file, stmt, 0,
1968 TDF_SLIM | (dump_flags & TDF_LINENO));
1969 fprintf (dump_file, "\n");
1971 print_rtl (dump_file, since ? NEXT_INSN (since) : since);
1975 /* Maps the blocks that do not contain tree labels to rtx labels. */
1977 static hash_map<basic_block, rtx_code_label *> *lab_rtx_for_bb;
1979 /* Returns the label_rtx expression for a label starting basic block BB. */
1981 static rtx
1982 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED)
1984 gimple_stmt_iterator gsi;
1985 tree lab;
1986 gimple lab_stmt;
1988 if (bb->flags & BB_RTL)
1989 return block_label (bb);
1991 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
1992 if (elt)
1993 return *elt;
1995 /* Find the tree label if it is present. */
1997 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1999 lab_stmt = gsi_stmt (gsi);
2000 if (gimple_code (lab_stmt) != GIMPLE_LABEL)
2001 break;
2003 lab = gimple_label_label (lab_stmt);
2004 if (DECL_NONLOCAL (lab))
2005 break;
2007 return label_rtx (lab);
2010 rtx_code_label *l = gen_label_rtx ();
2011 lab_rtx_for_bb->put (bb, l);
2012 return l;
2016 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
2017 of a basic block where we just expanded the conditional at the end,
2018 possibly clean up the CFG and instruction sequence. LAST is the
2019 last instruction before the just emitted jump sequence. */
2021 static void
2022 maybe_cleanup_end_of_block (edge e, rtx_insn *last)
2024 /* Special case: when jumpif decides that the condition is
2025 trivial it emits an unconditional jump (and the necessary
2026 barrier). But we still have two edges, the fallthru one is
2027 wrong. purge_dead_edges would clean this up later. Unfortunately
2028 we have to insert insns (and split edges) before
2029 find_many_sub_basic_blocks and hence before purge_dead_edges.
2030 But splitting edges might create new blocks which depend on the
2031 fact that if there are two edges there's no barrier. So the
2032 barrier would get lost and verify_flow_info would ICE. Instead
2033 of auditing all edge splitters to care for the barrier (which
2034 normally isn't there in a cleaned CFG), fix it here. */
2035 if (BARRIER_P (get_last_insn ()))
2037 rtx_insn *insn;
2038 remove_edge (e);
2039 /* Now, we have a single successor block, if we have insns to
2040 insert on the remaining edge we potentially will insert
2041 it at the end of this block (if the dest block isn't feasible)
2042 in order to avoid splitting the edge. This insertion will take
2043 place in front of the last jump. But we might have emitted
2044 multiple jumps (conditional and one unconditional) to the
2045 same destination. Inserting in front of the last one then
2046 is a problem. See PR 40021. We fix this by deleting all
2047 jumps except the last unconditional one. */
2048 insn = PREV_INSN (get_last_insn ());
2049 /* Make sure we have an unconditional jump. Otherwise we're
2050 confused. */
2051 gcc_assert (JUMP_P (insn) && !any_condjump_p (insn));
2052 for (insn = PREV_INSN (insn); insn != last;)
2054 insn = PREV_INSN (insn);
2055 if (JUMP_P (NEXT_INSN (insn)))
2057 if (!any_condjump_p (NEXT_INSN (insn)))
2059 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn))));
2060 delete_insn (NEXT_INSN (NEXT_INSN (insn)));
2062 delete_insn (NEXT_INSN (insn));
2068 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
2069 Returns a new basic block if we've terminated the current basic
2070 block and created a new one. */
2072 static basic_block
2073 expand_gimple_cond (basic_block bb, gimple stmt)
2075 basic_block new_bb, dest;
2076 edge new_edge;
2077 edge true_edge;
2078 edge false_edge;
2079 rtx_insn *last2, *last;
2080 enum tree_code code;
2081 tree op0, op1;
2083 code = gimple_cond_code (stmt);
2084 op0 = gimple_cond_lhs (stmt);
2085 op1 = gimple_cond_rhs (stmt);
2086 /* We're sometimes presented with such code:
2087 D.123_1 = x < y;
2088 if (D.123_1 != 0)
2090 This would expand to two comparisons which then later might
2091 be cleaned up by combine. But some pattern matchers like if-conversion
2092 work better when there's only one compare, so make up for this
2093 here as special exception if TER would have made the same change. */
2094 if (SA.values
2095 && TREE_CODE (op0) == SSA_NAME
2096 && TREE_CODE (TREE_TYPE (op0)) == BOOLEAN_TYPE
2097 && TREE_CODE (op1) == INTEGER_CST
2098 && ((gimple_cond_code (stmt) == NE_EXPR
2099 && integer_zerop (op1))
2100 || (gimple_cond_code (stmt) == EQ_EXPR
2101 && integer_onep (op1)))
2102 && bitmap_bit_p (SA.values, SSA_NAME_VERSION (op0)))
2104 gimple second = SSA_NAME_DEF_STMT (op0);
2105 if (gimple_code (second) == GIMPLE_ASSIGN)
2107 enum tree_code code2 = gimple_assign_rhs_code (second);
2108 if (TREE_CODE_CLASS (code2) == tcc_comparison)
2110 code = code2;
2111 op0 = gimple_assign_rhs1 (second);
2112 op1 = gimple_assign_rhs2 (second);
2114 /* If jumps are cheap turn some more codes into
2115 jumpy sequences. */
2116 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4)
2118 if ((code2 == BIT_AND_EXPR
2119 && TYPE_PRECISION (TREE_TYPE (op0)) == 1
2120 && TREE_CODE (gimple_assign_rhs2 (second)) != INTEGER_CST)
2121 || code2 == TRUTH_AND_EXPR)
2123 code = TRUTH_ANDIF_EXPR;
2124 op0 = gimple_assign_rhs1 (second);
2125 op1 = gimple_assign_rhs2 (second);
2127 else if (code2 == BIT_IOR_EXPR || code2 == TRUTH_OR_EXPR)
2129 code = TRUTH_ORIF_EXPR;
2130 op0 = gimple_assign_rhs1 (second);
2131 op1 = gimple_assign_rhs2 (second);
2137 last2 = last = get_last_insn ();
2139 extract_true_false_edges_from_block (bb, &true_edge, &false_edge);
2140 set_curr_insn_location (gimple_location (stmt));
2142 /* These flags have no purpose in RTL land. */
2143 true_edge->flags &= ~EDGE_TRUE_VALUE;
2144 false_edge->flags &= ~EDGE_FALSE_VALUE;
2146 /* We can either have a pure conditional jump with one fallthru edge or
2147 two-way jump that needs to be decomposed into two basic blocks. */
2148 if (false_edge->dest == bb->next_bb)
2150 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2151 true_edge->probability);
2152 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2153 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2154 set_curr_insn_location (true_edge->goto_locus);
2155 false_edge->flags |= EDGE_FALLTHRU;
2156 maybe_cleanup_end_of_block (false_edge, last);
2157 return NULL;
2159 if (true_edge->dest == bb->next_bb)
2161 jumpifnot_1 (code, op0, op1, label_rtx_for_bb (false_edge->dest),
2162 false_edge->probability);
2163 maybe_dump_rtl_for_gimple_stmt (stmt, last);
2164 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2165 set_curr_insn_location (false_edge->goto_locus);
2166 true_edge->flags |= EDGE_FALLTHRU;
2167 maybe_cleanup_end_of_block (true_edge, last);
2168 return NULL;
2171 jumpif_1 (code, op0, op1, label_rtx_for_bb (true_edge->dest),
2172 true_edge->probability);
2173 last = get_last_insn ();
2174 if (false_edge->goto_locus != UNKNOWN_LOCATION)
2175 set_curr_insn_location (false_edge->goto_locus);
2176 emit_jump (label_rtx_for_bb (false_edge->dest));
2178 BB_END (bb) = last;
2179 if (BARRIER_P (BB_END (bb)))
2180 BB_END (bb) = PREV_INSN (BB_END (bb));
2181 update_bb_for_insn (bb);
2183 new_bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
2184 dest = false_edge->dest;
2185 redirect_edge_succ (false_edge, new_bb);
2186 false_edge->flags |= EDGE_FALLTHRU;
2187 new_bb->count = false_edge->count;
2188 new_bb->frequency = EDGE_FREQUENCY (false_edge);
2189 add_bb_to_loop (new_bb, bb->loop_father);
2190 new_edge = make_edge (new_bb, dest, 0);
2191 new_edge->probability = REG_BR_PROB_BASE;
2192 new_edge->count = new_bb->count;
2193 if (BARRIER_P (BB_END (new_bb)))
2194 BB_END (new_bb) = PREV_INSN (BB_END (new_bb));
2195 update_bb_for_insn (new_bb);
2197 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
2199 if (true_edge->goto_locus != UNKNOWN_LOCATION)
2201 set_curr_insn_location (true_edge->goto_locus);
2202 true_edge->goto_locus = curr_insn_location ();
2205 return new_bb;
2208 /* Mark all calls that can have a transaction restart. */
2210 static void
2211 mark_transaction_restart_calls (gimple stmt)
2213 struct tm_restart_node dummy;
2214 void **slot;
2216 if (!cfun->gimple_df->tm_restart)
2217 return;
2219 dummy.stmt = stmt;
2220 slot = htab_find_slot (cfun->gimple_df->tm_restart, &dummy, NO_INSERT);
2221 if (slot)
2223 struct tm_restart_node *n = (struct tm_restart_node *) *slot;
2224 tree list = n->label_or_list;
2225 rtx_insn *insn;
2227 for (insn = next_real_insn (get_last_insn ());
2228 !CALL_P (insn);
2229 insn = next_real_insn (insn))
2230 continue;
2232 if (TREE_CODE (list) == LABEL_DECL)
2233 add_reg_note (insn, REG_TM, label_rtx (list));
2234 else
2235 for (; list ; list = TREE_CHAIN (list))
2236 add_reg_note (insn, REG_TM, label_rtx (TREE_VALUE (list)));
2240 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
2241 statement STMT. */
2243 static void
2244 expand_call_stmt (gimple stmt)
2246 tree exp, decl, lhs;
2247 bool builtin_p;
2248 size_t i;
2250 if (gimple_call_internal_p (stmt))
2252 expand_internal_call (stmt);
2253 return;
2256 exp = build_vl_exp (CALL_EXPR, gimple_call_num_args (stmt) + 3);
2258 CALL_EXPR_FN (exp) = gimple_call_fn (stmt);
2259 decl = gimple_call_fndecl (stmt);
2260 builtin_p = decl && DECL_BUILT_IN (decl);
2262 /* If this is not a builtin function, the function type through which the
2263 call is made may be different from the type of the function. */
2264 if (!builtin_p)
2265 CALL_EXPR_FN (exp)
2266 = fold_convert (build_pointer_type (gimple_call_fntype (stmt)),
2267 CALL_EXPR_FN (exp));
2269 TREE_TYPE (exp) = gimple_call_return_type (stmt);
2270 CALL_EXPR_STATIC_CHAIN (exp) = gimple_call_chain (stmt);
2272 for (i = 0; i < gimple_call_num_args (stmt); i++)
2274 tree arg = gimple_call_arg (stmt, i);
2275 gimple def;
2276 /* TER addresses into arguments of builtin functions so we have a
2277 chance to infer more correct alignment information. See PR39954. */
2278 if (builtin_p
2279 && TREE_CODE (arg) == SSA_NAME
2280 && (def = get_gimple_for_ssa_name (arg))
2281 && gimple_assign_rhs_code (def) == ADDR_EXPR)
2282 arg = gimple_assign_rhs1 (def);
2283 CALL_EXPR_ARG (exp, i) = arg;
2286 if (gimple_has_side_effects (stmt))
2287 TREE_SIDE_EFFECTS (exp) = 1;
2289 if (gimple_call_nothrow_p (stmt))
2290 TREE_NOTHROW (exp) = 1;
2292 CALL_EXPR_TAILCALL (exp) = gimple_call_tail_p (stmt);
2293 CALL_EXPR_RETURN_SLOT_OPT (exp) = gimple_call_return_slot_opt_p (stmt);
2294 if (decl
2295 && DECL_BUILT_IN_CLASS (decl) == BUILT_IN_NORMAL
2296 && (DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA
2297 || DECL_FUNCTION_CODE (decl) == BUILT_IN_ALLOCA_WITH_ALIGN))
2298 CALL_ALLOCA_FOR_VAR_P (exp) = gimple_call_alloca_for_var_p (stmt);
2299 else
2300 CALL_FROM_THUNK_P (exp) = gimple_call_from_thunk_p (stmt);
2301 CALL_EXPR_VA_ARG_PACK (exp) = gimple_call_va_arg_pack_p (stmt);
2302 SET_EXPR_LOCATION (exp, gimple_location (stmt));
2304 /* Ensure RTL is created for debug args. */
2305 if (decl && DECL_HAS_DEBUG_ARGS_P (decl))
2307 vec<tree, va_gc> **debug_args = decl_debug_args_lookup (decl);
2308 unsigned int ix;
2309 tree dtemp;
2311 if (debug_args)
2312 for (ix = 1; (*debug_args)->iterate (ix, &dtemp); ix += 2)
2314 gcc_assert (TREE_CODE (dtemp) == DEBUG_EXPR_DECL);
2315 expand_debug_expr (dtemp);
2319 lhs = gimple_call_lhs (stmt);
2320 if (lhs)
2321 expand_assignment (lhs, exp, false);
2322 else
2323 expand_expr (exp, const0_rtx, VOIDmode, EXPAND_NORMAL);
2325 mark_transaction_restart_calls (stmt);
2329 /* Generate RTL for an asm statement (explicit assembler code).
2330 STRING is a STRING_CST node containing the assembler code text,
2331 or an ADDR_EXPR containing a STRING_CST. VOL nonzero means the
2332 insn is volatile; don't optimize it. */
2334 static void
2335 expand_asm_loc (tree string, int vol, location_t locus)
2337 rtx body;
2339 if (TREE_CODE (string) == ADDR_EXPR)
2340 string = TREE_OPERAND (string, 0);
2342 body = gen_rtx_ASM_INPUT_loc (VOIDmode,
2343 ggc_strdup (TREE_STRING_POINTER (string)),
2344 locus);
2346 MEM_VOLATILE_P (body) = vol;
2348 emit_insn (body);
/* Return the number of times character C occurs in string S.
   S must be a NUL-terminated string; the terminator is not counted.  */
static int
n_occurrences (int c, const char *s)
{
  int n = 0;
  while (*s)
    n += (*s++ == c);
  return n;
}
2361 /* A subroutine of expand_asm_operands. Check that all operands have
2362 the same number of alternatives. Return true if so. */
2364 static bool
2365 check_operand_nalternatives (tree outputs, tree inputs)
2367 if (outputs || inputs)
2369 tree tmp = TREE_PURPOSE (outputs ? outputs : inputs);
2370 int nalternatives
2371 = n_occurrences (',', TREE_STRING_POINTER (TREE_VALUE (tmp)));
2372 tree next = inputs;
2374 if (nalternatives + 1 > MAX_RECOG_ALTERNATIVES)
2376 error ("too many alternatives in %<asm%>");
2377 return false;
2380 tmp = outputs;
2381 while (tmp)
2383 const char *constraint
2384 = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (tmp)));
2386 if (n_occurrences (',', constraint) != nalternatives)
2388 error ("operand constraints for %<asm%> differ "
2389 "in number of alternatives");
2390 return false;
2393 if (TREE_CHAIN (tmp))
2394 tmp = TREE_CHAIN (tmp);
2395 else
2396 tmp = next, next = 0;
2400 return true;
2403 /* Check for overlap between registers marked in CLOBBERED_REGS and
2404 anything inappropriate in T. Emit error and return the register
2405 variable definition for error, NULL_TREE for ok. */
2407 static bool
2408 tree_conflicts_with_clobbers_p (tree t, HARD_REG_SET *clobbered_regs)
2410 /* Conflicts between asm-declared register variables and the clobber
2411 list are not allowed. */
2412 tree overlap = tree_overlaps_hard_reg_set (t, clobbered_regs);
2414 if (overlap)
2416 error ("asm-specifier for variable %qE conflicts with asm clobber list",
2417 DECL_NAME (overlap));
2419 /* Reset registerness to stop multiple errors emitted for a single
2420 variable. */
2421 DECL_REGISTER (overlap) = 0;
2422 return true;
2425 return false;
2428 /* Generate RTL for an asm statement with arguments.
2429 STRING is the instruction template.
2430 OUTPUTS is a list of output arguments (lvalues); INPUTS a list of inputs.
2431 Each output or input has an expression in the TREE_VALUE and
2432 a tree list in TREE_PURPOSE which in turn contains a constraint
2433 name in TREE_VALUE (or NULL_TREE) and a constraint string
2434 in TREE_PURPOSE.
2435 CLOBBERS is a list of STRING_CST nodes each naming a hard register
2436 that is clobbered by this insn.
2438 LABELS is a list of labels, and if LABELS is non-NULL, FALLTHRU_BB
2439 should be the fallthru basic block of the asm goto.
2441 Not all kinds of lvalue that may appear in OUTPUTS can be stored directly.
2442 Some elements of OUTPUTS may be replaced with trees representing temporary
2443 values. The caller should copy those temporary values to the originally
2444 specified lvalues.
2446 VOL nonzero means the insn is volatile; don't optimize it. */
2448 static void
2449 expand_asm_operands (tree string, tree outputs, tree inputs,
2450 tree clobbers, tree labels, basic_block fallthru_bb,
2451 int vol, location_t locus)
2453 rtvec argvec, constraintvec, labelvec;
2454 rtx body;
2455 int ninputs = list_length (inputs);
2456 int noutputs = list_length (outputs);
2457 int nlabels = list_length (labels);
2458 int ninout;
2459 int nclobbers;
2460 HARD_REG_SET clobbered_regs;
2461 int clobber_conflict_found = 0;
2462 tree tail;
2463 tree t;
2464 int i;
2465 /* Vector of RTX's of evaluated output operands. */
2466 rtx *output_rtx = XALLOCAVEC (rtx, noutputs);
2467 int *inout_opnum = XALLOCAVEC (int, noutputs);
2468 rtx *real_output_rtx = XALLOCAVEC (rtx, noutputs);
2469 enum machine_mode *inout_mode = XALLOCAVEC (enum machine_mode, noutputs);
2470 const char **constraints = XALLOCAVEC (const char *, noutputs + ninputs);
2471 int old_generating_concat_p = generating_concat_p;
2472 rtx_code_label *fallthru_label = NULL;
2474 /* An ASM with no outputs needs to be treated as volatile, for now. */
2475 if (noutputs == 0)
2476 vol = 1;
2478 if (! check_operand_nalternatives (outputs, inputs))
2479 return;
2481 string = resolve_asm_operand_names (string, outputs, inputs, labels);
2483 /* Collect constraints. */
2484 i = 0;
2485 for (t = outputs; t ; t = TREE_CHAIN (t), i++)
2486 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2487 for (t = inputs; t ; t = TREE_CHAIN (t), i++)
2488 constraints[i] = TREE_STRING_POINTER (TREE_VALUE (TREE_PURPOSE (t)));
2490 /* Sometimes we wish to automatically clobber registers across an asm.
2491 Case in point is when the i386 backend moved from cc0 to a hard reg --
2492 maintaining source-level compatibility means automatically clobbering
2493 the flags register. */
2494 clobbers = targetm.md_asm_clobbers (outputs, inputs, clobbers);
2496 /* Count the number of meaningful clobbered registers, ignoring what
2497 we would ignore later. */
2498 nclobbers = 0;
2499 CLEAR_HARD_REG_SET (clobbered_regs);
2500 for (tail = clobbers; tail; tail = TREE_CHAIN (tail))
2502 const char *regname;
2503 int nregs;
2505 if (TREE_VALUE (tail) == error_mark_node)
2506 return;
2507 regname = TREE_STRING_POINTER (TREE_VALUE (tail));
2509 i = decode_reg_name_and_count (regname, &nregs);
2510 if (i == -4)
2511 ++nclobbers;
2512 else if (i == -2)
2513 error ("unknown register name %qs in %<asm%>", regname);
2515 /* Mark clobbered registers. */
2516 if (i >= 0)
2518 int reg;
2520 for (reg = i; reg < i + nregs; reg++)
2522 ++nclobbers;
2524 /* Clobbering the PIC register is an error. */
2525 if (reg == (int) PIC_OFFSET_TABLE_REGNUM)
2527 error ("PIC register clobbered by %qs in %<asm%>", regname);
2528 return;
2531 SET_HARD_REG_BIT (clobbered_regs, reg);
2536 /* First pass over inputs and outputs checks validity and sets
2537 mark_addressable if needed. */
2539 ninout = 0;
2540 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
2542 tree val = TREE_VALUE (tail);
2543 tree type = TREE_TYPE (val);
2544 const char *constraint;
2545 bool is_inout;
2546 bool allows_reg;
2547 bool allows_mem;
2549 /* If there's an erroneous arg, emit no insn. */
2550 if (type == error_mark_node)
2551 return;
2553 /* Try to parse the output constraint. If that fails, there's
2554 no point in going further. */
2555 constraint = constraints[i];
2556 if (!parse_output_constraint (&constraint, i, ninputs, noutputs,
2557 &allows_mem, &allows_reg, &is_inout))
2558 return;
2560 if (! allows_reg
2561 && (allows_mem
2562 || is_inout
2563 || (DECL_P (val)
2564 && REG_P (DECL_RTL (val))
2565 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type))))
2566 mark_addressable (val);
2568 if (is_inout)
2569 ninout++;
2572 ninputs += ninout;
2573 if (ninputs + noutputs > MAX_RECOG_OPERANDS)
2575 error ("more than %d operands in %<asm%>", MAX_RECOG_OPERANDS);
2576 return;
2579 for (i = 0, tail = inputs; tail; i++, tail = TREE_CHAIN (tail))
2581 bool allows_reg, allows_mem;
2582 const char *constraint;
2584 /* If there's an erroneous arg, emit no insn, because the ASM_INPUT
2585 would get VOIDmode and that could cause a crash in reload. */
2586 if (TREE_TYPE (TREE_VALUE (tail)) == error_mark_node)
2587 return;
2589 constraint = constraints[i + noutputs];
2590 if (! parse_input_constraint (&constraint, i, ninputs, noutputs, ninout,
2591 constraints, &allows_mem, &allows_reg))
2592 return;
2594 if (! allows_reg && allows_mem)
2595 mark_addressable (TREE_VALUE (tail));
2598 /* Second pass evaluates arguments. */
2600 /* Make sure stack is consistent for asm goto. */
2601 if (nlabels > 0)
2602 do_pending_stack_adjust ();
2604 ninout = 0;
2605 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
2607 tree val = TREE_VALUE (tail);
2608 tree type = TREE_TYPE (val);
2609 bool is_inout;
2610 bool allows_reg;
2611 bool allows_mem;
2612 rtx op;
2613 bool ok;
2615 ok = parse_output_constraint (&constraints[i], i, ninputs,
2616 noutputs, &allows_mem, &allows_reg,
2617 &is_inout);
2618 gcc_assert (ok);
2620 /* If an output operand is not a decl or indirect ref and our constraint
2621 allows a register, make a temporary to act as an intermediate.
2622 Make the asm insn write into that, then our caller will copy it to
2623 the real output operand. Likewise for promoted variables. */
2625 generating_concat_p = 0;
2627 real_output_rtx[i] = NULL_RTX;
2628 if ((TREE_CODE (val) == INDIRECT_REF
2629 && allows_mem)
2630 || (DECL_P (val)
2631 && (allows_mem || REG_P (DECL_RTL (val)))
2632 && ! (REG_P (DECL_RTL (val))
2633 && GET_MODE (DECL_RTL (val)) != TYPE_MODE (type)))
2634 || ! allows_reg
2635 || is_inout)
2637 op = expand_expr (val, NULL_RTX, VOIDmode,
2638 !allows_reg ? EXPAND_MEMORY : EXPAND_WRITE);
2639 if (MEM_P (op))
2640 op = validize_mem (op);
2642 if (! allows_reg && !MEM_P (op))
2643 error ("output number %d not directly addressable", i);
2644 if ((! allows_mem && MEM_P (op))
2645 || GET_CODE (op) == CONCAT)
2647 real_output_rtx[i] = op;
2648 op = gen_reg_rtx (GET_MODE (op));
2649 if (is_inout)
2650 emit_move_insn (op, real_output_rtx[i]);
2653 else
2655 op = assign_temp (type, 0, 1);
2656 op = validize_mem (op);
2657 if (!MEM_P (op) && TREE_CODE (TREE_VALUE (tail)) == SSA_NAME)
2658 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (TREE_VALUE (tail)), op);
2659 TREE_VALUE (tail) = make_tree (type, op);
2661 output_rtx[i] = op;
2663 generating_concat_p = old_generating_concat_p;
2665 if (is_inout)
2667 inout_mode[ninout] = TYPE_MODE (type);
2668 inout_opnum[ninout++] = i;
2671 if (tree_conflicts_with_clobbers_p (val, &clobbered_regs))
2672 clobber_conflict_found = 1;
2675 /* Make vectors for the expression-rtx, constraint strings,
2676 and named operands. */
2678 argvec = rtvec_alloc (ninputs);
2679 constraintvec = rtvec_alloc (ninputs);
2680 labelvec = rtvec_alloc (nlabels);
2682 body = gen_rtx_ASM_OPERANDS ((noutputs == 0 ? VOIDmode
2683 : GET_MODE (output_rtx[0])),
2684 ggc_strdup (TREE_STRING_POINTER (string)),
2685 empty_string, 0, argvec, constraintvec,
2686 labelvec, locus);
2688 MEM_VOLATILE_P (body) = vol;
2690 /* Eval the inputs and put them into ARGVEC.
2691 Put their constraints into ASM_INPUTs and store in CONSTRAINTS. */
2693 for (i = 0, tail = inputs; tail; tail = TREE_CHAIN (tail), ++i)
2695 bool allows_reg, allows_mem;
2696 const char *constraint;
2697 tree val, type;
2698 rtx op;
2699 bool ok;
2701 constraint = constraints[i + noutputs];
2702 ok = parse_input_constraint (&constraint, i, ninputs, noutputs, ninout,
2703 constraints, &allows_mem, &allows_reg);
2704 gcc_assert (ok);
2706 generating_concat_p = 0;
2708 val = TREE_VALUE (tail);
2709 type = TREE_TYPE (val);
2710 /* EXPAND_INITIALIZER will not generate code for valid initializer
2711 constants, but will still generate code for other types of operand.
2712 This is the behavior we want for constant constraints. */
2713 op = expand_expr (val, NULL_RTX, VOIDmode,
2714 allows_reg ? EXPAND_NORMAL
2715 : allows_mem ? EXPAND_MEMORY
2716 : EXPAND_INITIALIZER);
2718 /* Never pass a CONCAT to an ASM. */
2719 if (GET_CODE (op) == CONCAT)
2720 op = force_reg (GET_MODE (op), op);
2721 else if (MEM_P (op))
2722 op = validize_mem (op);
2724 if (asm_operand_ok (op, constraint, NULL) <= 0)
2726 if (allows_reg && TYPE_MODE (type) != BLKmode)
2727 op = force_reg (TYPE_MODE (type), op);
2728 else if (!allows_mem)
2729 warning (0, "asm operand %d probably doesn%'t match constraints",
2730 i + noutputs);
2731 else if (MEM_P (op))
2733 /* We won't recognize either volatile memory or memory
2734 with a queued address as available a memory_operand
2735 at this point. Ignore it: clearly this *is* a memory. */
2737 else
2738 gcc_unreachable ();
2741 generating_concat_p = old_generating_concat_p;
2742 ASM_OPERANDS_INPUT (body, i) = op;
2744 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, i)
2745 = gen_rtx_ASM_INPUT_loc (TYPE_MODE (type),
2746 ggc_strdup (constraints[i + noutputs]),
2747 locus);
2749 if (tree_conflicts_with_clobbers_p (val, &clobbered_regs))
2750 clobber_conflict_found = 1;
2753 /* Protect all the operands from the queue now that they have all been
2754 evaluated. */
2756 generating_concat_p = 0;
2758 /* For in-out operands, copy output rtx to input rtx. */
2759 for (i = 0; i < ninout; i++)
2761 int j = inout_opnum[i];
2762 char buffer[16];
2764 ASM_OPERANDS_INPUT (body, ninputs - ninout + i)
2765 = output_rtx[j];
2767 sprintf (buffer, "%d", j);
2768 ASM_OPERANDS_INPUT_CONSTRAINT_EXP (body, ninputs - ninout + i)
2769 = gen_rtx_ASM_INPUT_loc (inout_mode[i], ggc_strdup (buffer), locus);
2772 /* Copy labels to the vector. */
2773 for (i = 0, tail = labels; i < nlabels; ++i, tail = TREE_CHAIN (tail))
2775 rtx r;
2776 /* If asm goto has any labels in the fallthru basic block, use
2777 a label that we emit immediately after the asm goto. Expansion
2778 may insert further instructions into the same basic block after
2779 asm goto and if we don't do this, insertion of instructions on
2780 the fallthru edge might misbehave. See PR58670. */
2781 if (fallthru_bb
2782 && label_to_block_fn (cfun, TREE_VALUE (tail)) == fallthru_bb)
2784 if (fallthru_label == NULL_RTX)
2785 fallthru_label = gen_label_rtx ();
2786 r = fallthru_label;
2788 else
2789 r = label_rtx (TREE_VALUE (tail));
2790 ASM_OPERANDS_LABEL (body, i) = gen_rtx_LABEL_REF (Pmode, r);
2793 generating_concat_p = old_generating_concat_p;
2795 /* Now, for each output, construct an rtx
2796 (set OUTPUT (asm_operands INSN OUTPUTCONSTRAINT OUTPUTNUMBER
2797 ARGVEC CONSTRAINTS OPNAMES))
2798 If there is more than one, put them inside a PARALLEL. */
2800 if (nlabels > 0 && nclobbers == 0)
2802 gcc_assert (noutputs == 0);
2803 emit_jump_insn (body);
2805 else if (noutputs == 0 && nclobbers == 0)
2807 /* No output operands: put in a raw ASM_OPERANDS rtx. */
2808 emit_insn (body);
2810 else if (noutputs == 1 && nclobbers == 0)
2812 ASM_OPERANDS_OUTPUT_CONSTRAINT (body) = ggc_strdup (constraints[0]);
2813 emit_insn (gen_rtx_SET (VOIDmode, output_rtx[0], body));
2815 else
2817 rtx obody = body;
2818 int num = noutputs;
2820 if (num == 0)
2821 num = 1;
2823 body = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num + nclobbers));
2825 /* For each output operand, store a SET. */
2826 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
2828 XVECEXP (body, 0, i)
2829 = gen_rtx_SET (VOIDmode,
2830 output_rtx[i],
2831 gen_rtx_ASM_OPERANDS
2832 (GET_MODE (output_rtx[i]),
2833 ggc_strdup (TREE_STRING_POINTER (string)),
2834 ggc_strdup (constraints[i]),
2835 i, argvec, constraintvec, labelvec, locus));
2837 MEM_VOLATILE_P (SET_SRC (XVECEXP (body, 0, i))) = vol;
2840 /* If there are no outputs (but there are some clobbers)
2841 store the bare ASM_OPERANDS into the PARALLEL. */
2843 if (i == 0)
2844 XVECEXP (body, 0, i++) = obody;
2846 /* Store (clobber REG) for each clobbered register specified. */
2848 for (tail = clobbers; tail; tail = TREE_CHAIN (tail))
2850 const char *regname = TREE_STRING_POINTER (TREE_VALUE (tail));
2851 int reg, nregs;
2852 int j = decode_reg_name_and_count (regname, &nregs);
2853 rtx clobbered_reg;
2855 if (j < 0)
2857 if (j == -3) /* `cc', which is not a register */
2858 continue;
2860 if (j == -4) /* `memory', don't cache memory across asm */
2862 XVECEXP (body, 0, i++)
2863 = gen_rtx_CLOBBER (VOIDmode,
2864 gen_rtx_MEM
2865 (BLKmode,
2866 gen_rtx_SCRATCH (VOIDmode)));
2867 continue;
2870 /* Ignore unknown register, error already signaled. */
2871 continue;
2874 for (reg = j; reg < j + nregs; reg++)
2876 /* Use QImode since that's guaranteed to clobber just
2877 * one reg. */
2878 clobbered_reg = gen_rtx_REG (QImode, reg);
2880 /* Do sanity check for overlap between clobbers and
2881 respectively input and outputs that hasn't been
2882 handled. Such overlap should have been detected and
2883 reported above. */
2884 if (!clobber_conflict_found)
2886 int opno;
2888 /* We test the old body (obody) contents to avoid
2889 tripping over the under-construction body. */
2890 for (opno = 0; opno < noutputs; opno++)
2891 if (reg_overlap_mentioned_p (clobbered_reg,
2892 output_rtx[opno]))
2893 internal_error
2894 ("asm clobber conflict with output operand");
2896 for (opno = 0; opno < ninputs - ninout; opno++)
2897 if (reg_overlap_mentioned_p (clobbered_reg,
2898 ASM_OPERANDS_INPUT (obody,
2899 opno)))
2900 internal_error
2901 ("asm clobber conflict with input operand");
2904 XVECEXP (body, 0, i++)
2905 = gen_rtx_CLOBBER (VOIDmode, clobbered_reg);
2909 if (nlabels > 0)
2910 emit_jump_insn (body);
2911 else
2912 emit_insn (body);
2915 if (fallthru_label)
2916 emit_label (fallthru_label);
2918 /* For any outputs that needed reloading into registers, spill them
2919 back to where they belong. */
2920 for (i = 0; i < noutputs; ++i)
2921 if (real_output_rtx[i])
2922 emit_move_insn (real_output_rtx[i], output_rtx[i]);
2924 crtl->has_asm_statement = 1;
2925 free_temp_slots ();
2929 static void
2930 expand_asm_stmt (gimple stmt)
2932 int noutputs;
2933 tree outputs, tail, t;
2934 tree *o;
2935 size_t i, n;
2936 const char *s;
2937 tree str, out, in, cl, labels;
2938 location_t locus = gimple_location (stmt);
2939 basic_block fallthru_bb = NULL;
2941 /* Meh... convert the gimple asm operands into real tree lists.
2942 Eventually we should make all routines work on the vectors instead
2943 of relying on TREE_CHAIN. */
2944 out = NULL_TREE;
2945 n = gimple_asm_noutputs (stmt);
2946 if (n > 0)
2948 t = out = gimple_asm_output_op (stmt, 0);
2949 for (i = 1; i < n; i++)
2950 t = TREE_CHAIN (t) = gimple_asm_output_op (stmt, i);
2953 in = NULL_TREE;
2954 n = gimple_asm_ninputs (stmt);
2955 if (n > 0)
2957 t = in = gimple_asm_input_op (stmt, 0);
2958 for (i = 1; i < n; i++)
2959 t = TREE_CHAIN (t) = gimple_asm_input_op (stmt, i);
2962 cl = NULL_TREE;
2963 n = gimple_asm_nclobbers (stmt);
2964 if (n > 0)
2966 t = cl = gimple_asm_clobber_op (stmt, 0);
2967 for (i = 1; i < n; i++)
2968 t = TREE_CHAIN (t) = gimple_asm_clobber_op (stmt, i);
2971 labels = NULL_TREE;
2972 n = gimple_asm_nlabels (stmt);
2973 if (n > 0)
2975 edge fallthru = find_fallthru_edge (gimple_bb (stmt)->succs);
2976 if (fallthru)
2977 fallthru_bb = fallthru->dest;
2978 t = labels = gimple_asm_label_op (stmt, 0);
2979 for (i = 1; i < n; i++)
2980 t = TREE_CHAIN (t) = gimple_asm_label_op (stmt, i);
2983 s = gimple_asm_string (stmt);
2984 str = build_string (strlen (s), s);
2986 if (gimple_asm_input_p (stmt))
2988 expand_asm_loc (str, gimple_asm_volatile_p (stmt), locus);
2989 return;
2992 outputs = out;
2993 noutputs = gimple_asm_noutputs (stmt);
2994 /* o[I] is the place that output number I should be written. */
2995 o = (tree *) alloca (noutputs * sizeof (tree));
2997 /* Record the contents of OUTPUTS before it is modified. */
2998 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
2999 o[i] = TREE_VALUE (tail);
3001 /* Generate the ASM_OPERANDS insn; store into the TREE_VALUEs of
3002 OUTPUTS some trees for where the values were actually stored. */
3003 expand_asm_operands (str, outputs, in, cl, labels, fallthru_bb,
3004 gimple_asm_volatile_p (stmt), locus);
3006 /* Copy all the intermediate outputs into the specified outputs. */
3007 for (i = 0, tail = outputs; tail; tail = TREE_CHAIN (tail), i++)
3009 if (o[i] != TREE_VALUE (tail))
3011 expand_assignment (o[i], TREE_VALUE (tail), false);
3012 free_temp_slots ();
3014 /* Restore the original value so that it's correct the next
3015 time we expand this function. */
3016 TREE_VALUE (tail) = o[i];
3021 /* Emit code to jump to the address
3022 specified by the pointer expression EXP. */
3024 static void
3025 expand_computed_goto (tree exp)
3027 rtx x = expand_normal (exp);
3029 x = convert_memory_address (Pmode, x);
3031 do_pending_stack_adjust ();
3032 emit_indirect_jump (x);
3035 /* Generate RTL code for a `goto' statement with target label LABEL.
3036 LABEL should be a LABEL_DECL tree node that was or will later be
3037 defined with `expand_label'. */
3039 static void
3040 expand_goto (tree label)
3042 #ifdef ENABLE_CHECKING
3043 /* Check for a nonlocal goto to a containing function. Should have
3044 gotten translated to __builtin_nonlocal_goto. */
3045 tree context = decl_function_context (label);
3046 gcc_assert (!context || context == current_function_decl);
3047 #endif
3049 emit_jump (label_rtx (label));
3052 /* Output a return with no value. */
3054 static void
3055 expand_null_return_1 (void)
3057 clear_pending_stack_adjust ();
3058 do_pending_stack_adjust ();
3059 emit_jump (return_label);
/* Generate RTL to return from the current function, with no value.
   (That is, we do not do anything about returning any value.)  */

void
expand_null_return (void)
{
  /* If this function was declared to return a value, but we
     didn't, clobber the return registers so that they are not
     propagated live to the rest of the function.  */
  clobber_return_register ();

  expand_null_return_1 ();
}
3076 /* Generate RTL to return from the current function, with value VAL. */
3078 static void
3079 expand_value_return (rtx val)
3081 /* Copy the value to the return location unless it's already there. */
3083 tree decl = DECL_RESULT (current_function_decl);
3084 rtx return_reg = DECL_RTL (decl);
3085 if (return_reg != val)
3087 tree funtype = TREE_TYPE (current_function_decl);
3088 tree type = TREE_TYPE (decl);
3089 int unsignedp = TYPE_UNSIGNED (type);
3090 enum machine_mode old_mode = DECL_MODE (decl);
3091 enum machine_mode mode;
3092 if (DECL_BY_REFERENCE (decl))
3093 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 2);
3094 else
3095 mode = promote_function_mode (type, old_mode, &unsignedp, funtype, 1);
3097 if (mode != old_mode)
3098 val = convert_modes (mode, old_mode, val, unsignedp);
3100 if (GET_CODE (return_reg) == PARALLEL)
3101 emit_group_load (return_reg, val, type, int_size_in_bytes (type));
3102 else
3103 emit_move_insn (return_reg, val);
3106 expand_null_return_1 ();
3109 /* Generate RTL to evaluate the expression RETVAL and return it
3110 from the current function. */
3112 static void
3113 expand_return (tree retval)
3115 rtx result_rtl;
3116 rtx val = 0;
3117 tree retval_rhs;
3119 /* If function wants no value, give it none. */
3120 if (TREE_CODE (TREE_TYPE (TREE_TYPE (current_function_decl))) == VOID_TYPE)
3122 expand_normal (retval);
3123 expand_null_return ();
3124 return;
3127 if (retval == error_mark_node)
3129 /* Treat this like a return of no value from a function that
3130 returns a value. */
3131 expand_null_return ();
3132 return;
3134 else if ((TREE_CODE (retval) == MODIFY_EXPR
3135 || TREE_CODE (retval) == INIT_EXPR)
3136 && TREE_CODE (TREE_OPERAND (retval, 0)) == RESULT_DECL)
3137 retval_rhs = TREE_OPERAND (retval, 1);
3138 else
3139 retval_rhs = retval;
3141 result_rtl = DECL_RTL (DECL_RESULT (current_function_decl));
3143 /* If we are returning the RESULT_DECL, then the value has already
3144 been stored into it, so we don't have to do anything special. */
3145 if (TREE_CODE (retval_rhs) == RESULT_DECL)
3146 expand_value_return (result_rtl);
3148 /* If the result is an aggregate that is being returned in one (or more)
3149 registers, load the registers here. */
3151 else if (retval_rhs != 0
3152 && TYPE_MODE (TREE_TYPE (retval_rhs)) == BLKmode
3153 && REG_P (result_rtl))
3155 val = copy_blkmode_to_reg (GET_MODE (result_rtl), retval_rhs);
3156 if (val)
3158 /* Use the mode of the result value on the return register. */
3159 PUT_MODE (result_rtl, GET_MODE (val));
3160 expand_value_return (val);
3162 else
3163 expand_null_return ();
3165 else if (retval_rhs != 0
3166 && !VOID_TYPE_P (TREE_TYPE (retval_rhs))
3167 && (REG_P (result_rtl)
3168 || (GET_CODE (result_rtl) == PARALLEL)))
3170 /* Compute the return value into a temporary (usually a pseudo reg). */
3172 = assign_temp (TREE_TYPE (DECL_RESULT (current_function_decl)), 0, 1);
3173 val = expand_expr (retval_rhs, val, GET_MODE (val), EXPAND_NORMAL);
3174 val = force_not_mem (val);
3175 expand_value_return (val);
3177 else
3179 /* No hard reg used; calculate value into hard return reg. */
3180 expand_expr (retval, const0_rtx, VOIDmode, EXPAND_NORMAL);
3181 expand_value_return (result_rtl);
3185 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
3186 STMT that doesn't require special handling for outgoing edges. That
3187 is no tailcalls and no GIMPLE_COND. */
3189 static void
3190 expand_gimple_stmt_1 (gimple stmt)
3192 tree op0;
3194 set_curr_insn_location (gimple_location (stmt));
3196 switch (gimple_code (stmt))
3198 case GIMPLE_GOTO:
3199 op0 = gimple_goto_dest (stmt);
3200 if (TREE_CODE (op0) == LABEL_DECL)
3201 expand_goto (op0);
3202 else
3203 expand_computed_goto (op0);
3204 break;
3205 case GIMPLE_LABEL:
3206 expand_label (gimple_label_label (stmt));
3207 break;
3208 case GIMPLE_NOP:
3209 case GIMPLE_PREDICT:
3210 break;
3211 case GIMPLE_SWITCH:
3212 expand_case (stmt);
3213 break;
3214 case GIMPLE_ASM:
3215 expand_asm_stmt (stmt);
3216 break;
3217 case GIMPLE_CALL:
3218 expand_call_stmt (stmt);
3219 break;
3221 case GIMPLE_RETURN:
3222 op0 = gimple_return_retval (stmt);
3224 if (op0 && op0 != error_mark_node)
3226 tree result = DECL_RESULT (current_function_decl);
3228 /* If we are not returning the current function's RESULT_DECL,
3229 build an assignment to it. */
3230 if (op0 != result)
3232 /* I believe that a function's RESULT_DECL is unique. */
3233 gcc_assert (TREE_CODE (op0) != RESULT_DECL);
3235 /* ??? We'd like to use simply expand_assignment here,
3236 but this fails if the value is of BLKmode but the return
3237 decl is a register. expand_return has special handling
3238 for this combination, which eventually should move
3239 to common code. See comments there. Until then, let's
3240 build a modify expression :-/ */
3241 op0 = build2 (MODIFY_EXPR, TREE_TYPE (result),
3242 result, op0);
3245 if (!op0)
3246 expand_null_return ();
3247 else
3248 expand_return (op0);
3249 break;
3251 case GIMPLE_ASSIGN:
3253 tree lhs = gimple_assign_lhs (stmt);
3255 /* Tree expand used to fiddle with |= and &= of two bitfield
3256 COMPONENT_REFs here. This can't happen with gimple, the LHS
3257 of binary assigns must be a gimple reg. */
3259 if (TREE_CODE (lhs) != SSA_NAME
3260 || get_gimple_rhs_class (gimple_expr_code (stmt))
3261 == GIMPLE_SINGLE_RHS)
3263 tree rhs = gimple_assign_rhs1 (stmt);
3264 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt))
3265 == GIMPLE_SINGLE_RHS);
3266 if (gimple_has_location (stmt) && CAN_HAVE_LOCATION_P (rhs))
3267 SET_EXPR_LOCATION (rhs, gimple_location (stmt));
3268 if (TREE_CLOBBER_P (rhs))
3269 /* This is a clobber to mark the going out of scope for
3270 this LHS. */
3272 else
3273 expand_assignment (lhs, rhs,
3274 gimple_assign_nontemporal_move_p (stmt));
3276 else
3278 rtx target, temp;
3279 bool nontemporal = gimple_assign_nontemporal_move_p (stmt);
3280 struct separate_ops ops;
3281 bool promoted = false;
3283 target = expand_expr (lhs, NULL_RTX, VOIDmode, EXPAND_WRITE);
3284 if (GET_CODE (target) == SUBREG && SUBREG_PROMOTED_VAR_P (target))
3285 promoted = true;
3287 ops.code = gimple_assign_rhs_code (stmt);
3288 ops.type = TREE_TYPE (lhs);
3289 switch (get_gimple_rhs_class (gimple_expr_code (stmt)))
3291 case GIMPLE_TERNARY_RHS:
3292 ops.op2 = gimple_assign_rhs3 (stmt);
3293 /* Fallthru */
3294 case GIMPLE_BINARY_RHS:
3295 ops.op1 = gimple_assign_rhs2 (stmt);
3296 /* Fallthru */
3297 case GIMPLE_UNARY_RHS:
3298 ops.op0 = gimple_assign_rhs1 (stmt);
3299 break;
3300 default:
3301 gcc_unreachable ();
3303 ops.location = gimple_location (stmt);
3305 /* If we want to use a nontemporal store, force the value to
3306 register first. If we store into a promoted register,
3307 don't directly expand to target. */
3308 temp = nontemporal || promoted ? NULL_RTX : target;
3309 temp = expand_expr_real_2 (&ops, temp, GET_MODE (target),
3310 EXPAND_NORMAL);
3312 if (temp == target)
3314 else if (promoted)
3316 int unsignedp = SUBREG_PROMOTED_SIGN (target);
3317 /* If TEMP is a VOIDmode constant, use convert_modes to make
3318 sure that we properly convert it. */
3319 if (CONSTANT_P (temp) && GET_MODE (temp) == VOIDmode)
3321 temp = convert_modes (GET_MODE (target),
3322 TYPE_MODE (ops.type),
3323 temp, unsignedp);
3324 temp = convert_modes (GET_MODE (SUBREG_REG (target)),
3325 GET_MODE (target), temp, unsignedp);
3328 convert_move (SUBREG_REG (target), temp, unsignedp);
3330 else if (nontemporal && emit_storent_insn (target, temp))
3332 else
3334 temp = force_operand (temp, target);
3335 if (temp != target)
3336 emit_move_insn (target, temp);
3340 break;
3342 default:
3343 gcc_unreachable ();
3347 /* Expand one gimple statement STMT and return the last RTL instruction
3348 before any of the newly generated ones.
3350 In addition to generating the necessary RTL instructions this also
3351 sets REG_EH_REGION notes if necessary and sets the current source
3352 location for diagnostics. */
3354 static rtx_insn *
3355 expand_gimple_stmt (gimple stmt)
3357 location_t saved_location = input_location;
3358 rtx_insn *last = get_last_insn ();
3359 int lp_nr;
3361 gcc_assert (cfun);
3363 /* We need to save and restore the current source location so that errors
3364 discovered during expansion are emitted with the right location. But
3365 it would be better if the diagnostic routines used the source location
3366 embedded in the tree nodes rather than globals. */
3367 if (gimple_has_location (stmt))
3368 input_location = gimple_location (stmt);
3370 expand_gimple_stmt_1 (stmt);
3372 /* Free any temporaries used to evaluate this statement. */
3373 free_temp_slots ();
3375 input_location = saved_location;
3377 /* Mark all insns that may trap. */
3378 lp_nr = lookup_stmt_eh_lp (stmt);
3379 if (lp_nr)
3381 rtx_insn *insn;
3382 for (insn = next_real_insn (last); insn;
3383 insn = next_real_insn (insn))
3385 if (! find_reg_note (insn, REG_EH_REGION, NULL_RTX)
3386 /* If we want exceptions for non-call insns, any
3387 may_trap_p instruction may throw. */
3388 && GET_CODE (PATTERN (insn)) != CLOBBER
3389 && GET_CODE (PATTERN (insn)) != USE
3390 && insn_could_throw_p (insn))
3391 make_reg_eh_region_note (insn, 0, lp_nr);
3395 return last;
3398 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
3399 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
3400 generated a tail call (something that might be denied by the ABI
3401 rules governing the call; see calls.c).
3403 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
3404 can still reach the rest of BB. The case here is __builtin_sqrt,
3405 where the NaN result goes through the external function (with a
3406 tailcall) and the normal result happens via a sqrt instruction. */
3408 static basic_block
3409 expand_gimple_tailcall (basic_block bb, gimple stmt, bool *can_fallthru)
3411 rtx_insn *last2, *last;
3412 edge e;
3413 edge_iterator ei;
3414 int probability;
3415 gcov_type count;
3417 last2 = last = expand_gimple_stmt (stmt);
3419 for (last = NEXT_INSN (last); last; last = NEXT_INSN (last))
3420 if (CALL_P (last) && SIBLING_CALL_P (last))
3421 goto found;
3423 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3425 *can_fallthru = true;
3426 return NULL;
3428 found:
3429 /* ??? Wouldn't it be better to just reset any pending stack adjust?
3430 Any instructions emitted here are about to be deleted. */
3431 do_pending_stack_adjust ();
3433 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
3434 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
3435 EH or abnormal edges, we shouldn't have created a tail call in
3436 the first place. So it seems to me we should just be removing
3437 all edges here, or redirecting the existing fallthru edge to
3438 the exit block. */
3440 probability = 0;
3441 count = 0;
3443 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
3445 if (!(e->flags & (EDGE_ABNORMAL | EDGE_EH)))
3447 if (e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3449 e->dest->count -= e->count;
3450 e->dest->frequency -= EDGE_FREQUENCY (e);
3451 if (e->dest->count < 0)
3452 e->dest->count = 0;
3453 if (e->dest->frequency < 0)
3454 e->dest->frequency = 0;
3456 count += e->count;
3457 probability += e->probability;
3458 remove_edge (e);
3460 else
3461 ei_next (&ei);
3464 /* This is somewhat ugly: the call_expr expander often emits instructions
3465 after the sibcall (to perform the function return). These confuse the
3466 find_many_sub_basic_blocks code, so we need to get rid of these. */
3467 last = NEXT_INSN (last);
3468 gcc_assert (BARRIER_P (last));
3470 *can_fallthru = false;
3471 while (NEXT_INSN (last))
3473 /* For instance an sqrt builtin expander expands if with
3474 sibcall in the then and label for `else`. */
3475 if (LABEL_P (NEXT_INSN (last)))
3477 *can_fallthru = true;
3478 break;
3480 delete_insn (NEXT_INSN (last));
3483 e = make_edge (bb, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_ABNORMAL
3484 | EDGE_SIBCALL);
3485 e->probability += probability;
3486 e->count += count;
3487 BB_END (bb) = last;
3488 update_bb_for_insn (bb);
3490 if (NEXT_INSN (last))
3492 bb = create_basic_block (NEXT_INSN (last), get_last_insn (), bb);
3494 last = BB_END (bb);
3495 if (BARRIER_P (last))
3496 BB_END (bb) = PREV_INSN (last);
3499 maybe_dump_rtl_for_gimple_stmt (stmt, last2);
3501 return bb;
3504 /* Return the difference between the floor and the truncated result of
3505 a signed division by OP1 with remainder MOD. */
3506 static rtx
3507 floor_sdiv_adjust (enum machine_mode mode, rtx mod, rtx op1)
3509 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
3510 return gen_rtx_IF_THEN_ELSE
3511 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3512 gen_rtx_IF_THEN_ELSE
3513 (mode, gen_rtx_LT (BImode,
3514 gen_rtx_DIV (mode, op1, mod),
3515 const0_rtx),
3516 constm1_rtx, const0_rtx),
3517 const0_rtx);
3520 /* Return the difference between the ceil and the truncated result of
3521 a signed division by OP1 with remainder MOD. */
3522 static rtx
3523 ceil_sdiv_adjust (enum machine_mode mode, rtx mod, rtx op1)
3525 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
3526 return gen_rtx_IF_THEN_ELSE
3527 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3528 gen_rtx_IF_THEN_ELSE
3529 (mode, gen_rtx_GT (BImode,
3530 gen_rtx_DIV (mode, op1, mod),
3531 const0_rtx),
3532 const1_rtx, const0_rtx),
3533 const0_rtx);
3536 /* Return the difference between the ceil and the truncated result of
3537 an unsigned division by OP1 with remainder MOD. */
3538 static rtx
3539 ceil_udiv_adjust (enum machine_mode mode, rtx mod, rtx op1 ATTRIBUTE_UNUSED)
3541 /* (mod != 0 ? 1 : 0) */
3542 return gen_rtx_IF_THEN_ELSE
3543 (mode, gen_rtx_NE (BImode, mod, const0_rtx),
3544 const1_rtx, const0_rtx);
3547 /* Return the difference between the rounded and the truncated result
3548 of a signed division by OP1 with remainder MOD. Halfway cases are
3549 rounded away from zero, rather than to the nearest even number. */
3550 static rtx
3551 round_sdiv_adjust (enum machine_mode mode, rtx mod, rtx op1)
3553 /* (abs (mod) >= abs (op1) - abs (mod)
3554 ? (op1 / mod > 0 ? 1 : -1)
3555 : 0) */
3556 return gen_rtx_IF_THEN_ELSE
3557 (mode, gen_rtx_GE (BImode, gen_rtx_ABS (mode, mod),
3558 gen_rtx_MINUS (mode,
3559 gen_rtx_ABS (mode, op1),
3560 gen_rtx_ABS (mode, mod))),
3561 gen_rtx_IF_THEN_ELSE
3562 (mode, gen_rtx_GT (BImode,
3563 gen_rtx_DIV (mode, op1, mod),
3564 const0_rtx),
3565 const1_rtx, constm1_rtx),
3566 const0_rtx);
3569 /* Return the difference between the rounded and the truncated result
3570 of a unsigned division by OP1 with remainder MOD. Halfway cases
3571 are rounded away from zero, rather than to the nearest even
3572 number. */
3573 static rtx
3574 round_udiv_adjust (enum machine_mode mode, rtx mod, rtx op1)
3576 /* (mod >= op1 - mod ? 1 : 0) */
3577 return gen_rtx_IF_THEN_ELSE
3578 (mode, gen_rtx_GE (BImode, mod,
3579 gen_rtx_MINUS (mode, op1, mod)),
3580 const1_rtx, const0_rtx);
3583 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
3584 any rtl. */
3586 static rtx
3587 convert_debug_memory_address (enum machine_mode mode, rtx x,
3588 addr_space_t as)
3590 enum machine_mode xmode = GET_MODE (x);
3592 #ifndef POINTERS_EXTEND_UNSIGNED
3593 gcc_assert (mode == Pmode
3594 || mode == targetm.addr_space.address_mode (as));
3595 gcc_assert (xmode == mode || xmode == VOIDmode);
3596 #else
3597 rtx temp;
3599 gcc_assert (targetm.addr_space.valid_pointer_mode (mode, as));
3601 if (GET_MODE (x) == mode || GET_MODE (x) == VOIDmode)
3602 return x;
3604 if (GET_MODE_PRECISION (mode) < GET_MODE_PRECISION (xmode))
3605 x = simplify_gen_subreg (mode, x, xmode,
3606 subreg_lowpart_offset
3607 (mode, xmode));
3608 else if (POINTERS_EXTEND_UNSIGNED > 0)
3609 x = gen_rtx_ZERO_EXTEND (mode, x);
3610 else if (!POINTERS_EXTEND_UNSIGNED)
3611 x = gen_rtx_SIGN_EXTEND (mode, x);
3612 else
3614 switch (GET_CODE (x))
3616 case SUBREG:
3617 if ((SUBREG_PROMOTED_VAR_P (x)
3618 || (REG_P (SUBREG_REG (x)) && REG_POINTER (SUBREG_REG (x)))
3619 || (GET_CODE (SUBREG_REG (x)) == PLUS
3620 && REG_P (XEXP (SUBREG_REG (x), 0))
3621 && REG_POINTER (XEXP (SUBREG_REG (x), 0))
3622 && CONST_INT_P (XEXP (SUBREG_REG (x), 1))))
3623 && GET_MODE (SUBREG_REG (x)) == mode)
3624 return SUBREG_REG (x);
3625 break;
3626 case LABEL_REF:
3627 temp = gen_rtx_LABEL_REF (mode, LABEL_REF_LABEL (x));
3628 LABEL_REF_NONLOCAL_P (temp) = LABEL_REF_NONLOCAL_P (x);
3629 return temp;
3630 case SYMBOL_REF:
3631 temp = shallow_copy_rtx (x);
3632 PUT_MODE (temp, mode);
3633 return temp;
3634 case CONST:
3635 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3636 if (temp)
3637 temp = gen_rtx_CONST (mode, temp);
3638 return temp;
3639 case PLUS:
3640 case MINUS:
3641 if (CONST_INT_P (XEXP (x, 1)))
3643 temp = convert_debug_memory_address (mode, XEXP (x, 0), as);
3644 if (temp)
3645 return gen_rtx_fmt_ee (GET_CODE (x), mode, temp, XEXP (x, 1));
3647 break;
3648 default:
3649 break;
3651 /* Don't know how to express ptr_extend as operation in debug info. */
3652 return NULL;
3654 #endif /* POINTERS_EXTEND_UNSIGNED */
3656 return x;
3659 /* Return an RTX equivalent to the value of the parameter DECL. */
3661 static rtx
3662 expand_debug_parm_decl (tree decl)
3664 rtx incoming = DECL_INCOMING_RTL (decl);
3666 if (incoming
3667 && GET_MODE (incoming) != BLKmode
3668 && ((REG_P (incoming) && HARD_REGISTER_P (incoming))
3669 || (MEM_P (incoming)
3670 && REG_P (XEXP (incoming, 0))
3671 && HARD_REGISTER_P (XEXP (incoming, 0)))))
3673 rtx rtl = gen_rtx_ENTRY_VALUE (GET_MODE (incoming));
3675 #ifdef HAVE_window_save
3676 /* DECL_INCOMING_RTL uses the INCOMING_REGNO of parameter registers.
3677 If the target machine has an explicit window save instruction, the
3678 actual entry value is the corresponding OUTGOING_REGNO instead. */
3679 if (REG_P (incoming)
3680 && OUTGOING_REGNO (REGNO (incoming)) != REGNO (incoming))
3681 incoming
3682 = gen_rtx_REG_offset (incoming, GET_MODE (incoming),
3683 OUTGOING_REGNO (REGNO (incoming)), 0);
3684 else if (MEM_P (incoming))
3686 rtx reg = XEXP (incoming, 0);
3687 if (OUTGOING_REGNO (REGNO (reg)) != REGNO (reg))
3689 reg = gen_raw_REG (GET_MODE (reg), OUTGOING_REGNO (REGNO (reg)));
3690 incoming = replace_equiv_address_nv (incoming, reg);
3692 else
3693 incoming = copy_rtx (incoming);
3695 #endif
3697 ENTRY_VALUE_EXP (rtl) = incoming;
3698 return rtl;
3701 if (incoming
3702 && GET_MODE (incoming) != BLKmode
3703 && !TREE_ADDRESSABLE (decl)
3704 && MEM_P (incoming)
3705 && (XEXP (incoming, 0) == virtual_incoming_args_rtx
3706 || (GET_CODE (XEXP (incoming, 0)) == PLUS
3707 && XEXP (XEXP (incoming, 0), 0) == virtual_incoming_args_rtx
3708 && CONST_INT_P (XEXP (XEXP (incoming, 0), 1)))))
3709 return copy_rtx (incoming);
3711 return NULL_RTX;
3714 /* Return an RTX equivalent to the value of the tree expression EXP. */
3716 static rtx
3717 expand_debug_expr (tree exp)
3719 rtx op0 = NULL_RTX, op1 = NULL_RTX, op2 = NULL_RTX;
3720 enum machine_mode mode = TYPE_MODE (TREE_TYPE (exp));
3721 enum machine_mode inner_mode = VOIDmode;
3722 int unsignedp = TYPE_UNSIGNED (TREE_TYPE (exp));
3723 addr_space_t as;
3725 switch (TREE_CODE_CLASS (TREE_CODE (exp)))
3727 case tcc_expression:
3728 switch (TREE_CODE (exp))
3730 case COND_EXPR:
3731 case DOT_PROD_EXPR:
3732 case SAD_EXPR:
3733 case WIDEN_MULT_PLUS_EXPR:
3734 case WIDEN_MULT_MINUS_EXPR:
3735 case FMA_EXPR:
3736 goto ternary;
3738 case TRUTH_ANDIF_EXPR:
3739 case TRUTH_ORIF_EXPR:
3740 case TRUTH_AND_EXPR:
3741 case TRUTH_OR_EXPR:
3742 case TRUTH_XOR_EXPR:
3743 goto binary;
3745 case TRUTH_NOT_EXPR:
3746 goto unary;
3748 default:
3749 break;
3751 break;
3753 ternary:
3754 op2 = expand_debug_expr (TREE_OPERAND (exp, 2));
3755 if (!op2)
3756 return NULL_RTX;
3757 /* Fall through. */
3759 binary:
3760 case tcc_binary:
3761 case tcc_comparison:
3762 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
3763 if (!op1)
3764 return NULL_RTX;
3765 /* Fall through. */
3767 unary:
3768 case tcc_unary:
3769 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
3770 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
3771 if (!op0)
3772 return NULL_RTX;
3773 break;
3775 case tcc_type:
3776 case tcc_statement:
3777 gcc_unreachable ();
3779 case tcc_constant:
3780 case tcc_exceptional:
3781 case tcc_declaration:
3782 case tcc_reference:
3783 case tcc_vl_exp:
3784 break;
3787 switch (TREE_CODE (exp))
3789 case STRING_CST:
3790 if (!lookup_constant_def (exp))
3792 if (strlen (TREE_STRING_POINTER (exp)) + 1
3793 != (size_t) TREE_STRING_LENGTH (exp))
3794 return NULL_RTX;
3795 op0 = gen_rtx_CONST_STRING (Pmode, TREE_STRING_POINTER (exp));
3796 op0 = gen_rtx_MEM (BLKmode, op0);
3797 set_mem_attributes (op0, exp, 0);
3798 return op0;
3800 /* Fall through... */
3802 case INTEGER_CST:
3803 case REAL_CST:
3804 case FIXED_CST:
3805 op0 = expand_expr (exp, NULL_RTX, mode, EXPAND_INITIALIZER);
3806 return op0;
3808 case COMPLEX_CST:
3809 gcc_assert (COMPLEX_MODE_P (mode));
3810 op0 = expand_debug_expr (TREE_REALPART (exp));
3811 op1 = expand_debug_expr (TREE_IMAGPART (exp));
3812 return gen_rtx_CONCAT (mode, op0, op1);
3814 case DEBUG_EXPR_DECL:
3815 op0 = DECL_RTL_IF_SET (exp);
3817 if (op0)
3818 return op0;
3820 op0 = gen_rtx_DEBUG_EXPR (mode);
3821 DEBUG_EXPR_TREE_DECL (op0) = exp;
3822 SET_DECL_RTL (exp, op0);
3824 return op0;
3826 case VAR_DECL:
3827 case PARM_DECL:
3828 case FUNCTION_DECL:
3829 case LABEL_DECL:
3830 case CONST_DECL:
3831 case RESULT_DECL:
3832 op0 = DECL_RTL_IF_SET (exp);
3834 /* This decl was probably optimized away. */
3835 if (!op0)
3837 if (TREE_CODE (exp) != VAR_DECL
3838 || DECL_EXTERNAL (exp)
3839 || !TREE_STATIC (exp)
3840 || !DECL_NAME (exp)
3841 || DECL_HARD_REGISTER (exp)
3842 || DECL_IN_CONSTANT_POOL (exp)
3843 || mode == VOIDmode)
3844 return NULL;
3846 op0 = make_decl_rtl_for_debug (exp);
3847 if (!MEM_P (op0)
3848 || GET_CODE (XEXP (op0, 0)) != SYMBOL_REF
3849 || SYMBOL_REF_DECL (XEXP (op0, 0)) != exp)
3850 return NULL;
3852 else
3853 op0 = copy_rtx (op0);
3855 if (GET_MODE (op0) == BLKmode
3856 /* If op0 is not BLKmode, but mode is, adjust_mode
3857 below would ICE. While it is likely a FE bug,
3858 try to be robust here. See PR43166. */
3859 || mode == BLKmode
3860 || (mode == VOIDmode && GET_MODE (op0) != VOIDmode))
3862 gcc_assert (MEM_P (op0));
3863 op0 = adjust_address_nv (op0, mode, 0);
3864 return op0;
3867 /* Fall through. */
3869 adjust_mode:
3870 case PAREN_EXPR:
3871 case NOP_EXPR:
3872 case CONVERT_EXPR:
3874 inner_mode = GET_MODE (op0);
3876 if (mode == inner_mode)
3877 return op0;
3879 if (inner_mode == VOIDmode)
3881 if (TREE_CODE (exp) == SSA_NAME)
3882 inner_mode = TYPE_MODE (TREE_TYPE (exp));
3883 else
3884 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
3885 if (mode == inner_mode)
3886 return op0;
3889 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
3891 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
3892 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
3893 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
3894 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
3895 else
3896 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
3898 else if (FLOAT_MODE_P (mode))
3900 gcc_assert (TREE_CODE (exp) != SSA_NAME);
3901 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
3902 op0 = simplify_gen_unary (UNSIGNED_FLOAT, mode, op0, inner_mode);
3903 else
3904 op0 = simplify_gen_unary (FLOAT, mode, op0, inner_mode);
3906 else if (FLOAT_MODE_P (inner_mode))
3908 if (unsignedp)
3909 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
3910 else
3911 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
3913 else if (CONSTANT_P (op0)
3914 || GET_MODE_PRECISION (mode) <= GET_MODE_PRECISION (inner_mode))
3915 op0 = simplify_gen_subreg (mode, op0, inner_mode,
3916 subreg_lowpart_offset (mode,
3917 inner_mode));
3918 else if (TREE_CODE_CLASS (TREE_CODE (exp)) == tcc_unary
3919 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0)))
3920 : unsignedp)
3921 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
3922 else
3923 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
3925 return op0;
3928 case MEM_REF:
3929 if (!is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
3931 tree newexp = fold_binary (MEM_REF, TREE_TYPE (exp),
3932 TREE_OPERAND (exp, 0),
3933 TREE_OPERAND (exp, 1));
3934 if (newexp)
3935 return expand_debug_expr (newexp);
3937 /* FALLTHROUGH */
3938 case INDIRECT_REF:
3939 inner_mode = TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp, 0)));
3940 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
3941 if (!op0)
3942 return NULL;
3944 if (TREE_CODE (exp) == MEM_REF)
3946 if (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
3947 || (GET_CODE (op0) == PLUS
3948 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR))
3949 /* (mem (debug_implicit_ptr)) might confuse aliasing.
3950 Instead just use get_inner_reference. */
3951 goto component_ref;
3953 op1 = expand_debug_expr (TREE_OPERAND (exp, 1));
3954 if (!op1 || !CONST_INT_P (op1))
3955 return NULL;
3957 op0 = plus_constant (inner_mode, op0, INTVAL (op1));
3960 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
3962 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
3963 op0, as);
3964 if (op0 == NULL_RTX)
3965 return NULL;
3967 op0 = gen_rtx_MEM (mode, op0);
3968 set_mem_attributes (op0, exp, 0);
3969 if (TREE_CODE (exp) == MEM_REF
3970 && !is_gimple_mem_ref_addr (TREE_OPERAND (exp, 0)))
3971 set_mem_expr (op0, NULL_TREE);
3972 set_mem_addr_space (op0, as);
3974 return op0;
3976 case TARGET_MEM_REF:
3977 if (TREE_CODE (TMR_BASE (exp)) == ADDR_EXPR
3978 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp), 0)))
3979 return NULL;
3981 op0 = expand_debug_expr
3982 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp)), exp));
3983 if (!op0)
3984 return NULL;
3986 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (TREE_OPERAND (exp, 0))));
3987 op0 = convert_debug_memory_address (targetm.addr_space.address_mode (as),
3988 op0, as);
3989 if (op0 == NULL_RTX)
3990 return NULL;
3992 op0 = gen_rtx_MEM (mode, op0);
3994 set_mem_attributes (op0, exp, 0);
3995 set_mem_addr_space (op0, as);
3997 return op0;
3999 component_ref:
4000 case ARRAY_REF:
4001 case ARRAY_RANGE_REF:
4002 case COMPONENT_REF:
4003 case BIT_FIELD_REF:
4004 case REALPART_EXPR:
4005 case IMAGPART_EXPR:
4006 case VIEW_CONVERT_EXPR:
4008 enum machine_mode mode1;
4009 HOST_WIDE_INT bitsize, bitpos;
4010 tree offset;
4011 int volatilep = 0;
4012 tree tem = get_inner_reference (exp, &bitsize, &bitpos, &offset,
4013 &mode1, &unsignedp, &volatilep, false);
4014 rtx orig_op0;
4016 if (bitsize == 0)
4017 return NULL;
4019 orig_op0 = op0 = expand_debug_expr (tem);
4021 if (!op0)
4022 return NULL;
4024 if (offset)
4026 enum machine_mode addrmode, offmode;
4028 if (!MEM_P (op0))
4029 return NULL;
4031 op0 = XEXP (op0, 0);
4032 addrmode = GET_MODE (op0);
4033 if (addrmode == VOIDmode)
4034 addrmode = Pmode;
4036 op1 = expand_debug_expr (offset);
4037 if (!op1)
4038 return NULL;
4040 offmode = GET_MODE (op1);
4041 if (offmode == VOIDmode)
4042 offmode = TYPE_MODE (TREE_TYPE (offset));
4044 if (addrmode != offmode)
4045 op1 = simplify_gen_subreg (addrmode, op1, offmode,
4046 subreg_lowpart_offset (addrmode,
4047 offmode));
4049 /* Don't use offset_address here, we don't need a
4050 recognizable address, and we don't want to generate
4051 code. */
4052 op0 = gen_rtx_MEM (mode, simplify_gen_binary (PLUS, addrmode,
4053 op0, op1));
4056 if (MEM_P (op0))
4058 if (mode1 == VOIDmode)
4059 /* Bitfield. */
4060 mode1 = smallest_mode_for_size (bitsize, MODE_INT);
4061 if (bitpos >= BITS_PER_UNIT)
4063 op0 = adjust_address_nv (op0, mode1, bitpos / BITS_PER_UNIT);
4064 bitpos %= BITS_PER_UNIT;
4066 else if (bitpos < 0)
4068 HOST_WIDE_INT units
4069 = (-bitpos + BITS_PER_UNIT - 1) / BITS_PER_UNIT;
4070 op0 = adjust_address_nv (op0, mode1, units);
4071 bitpos += units * BITS_PER_UNIT;
4073 else if (bitpos == 0 && bitsize == GET_MODE_BITSIZE (mode))
4074 op0 = adjust_address_nv (op0, mode, 0);
4075 else if (GET_MODE (op0) != mode1)
4076 op0 = adjust_address_nv (op0, mode1, 0);
4077 else
4078 op0 = copy_rtx (op0);
4079 if (op0 == orig_op0)
4080 op0 = shallow_copy_rtx (op0);
4081 set_mem_attributes (op0, exp, 0);
4084 if (bitpos == 0 && mode == GET_MODE (op0))
4085 return op0;
4087 if (bitpos < 0)
4088 return NULL;
4090 if (GET_MODE (op0) == BLKmode)
4091 return NULL;
4093 if ((bitpos % BITS_PER_UNIT) == 0
4094 && bitsize == GET_MODE_BITSIZE (mode1))
4096 enum machine_mode opmode = GET_MODE (op0);
4098 if (opmode == VOIDmode)
4099 opmode = TYPE_MODE (TREE_TYPE (tem));
4101 /* This condition may hold if we're expanding the address
4102 right past the end of an array that turned out not to
4103 be addressable (i.e., the address was only computed in
4104 debug stmts). The gen_subreg below would rightfully
4105 crash, and the address doesn't really exist, so just
4106 drop it. */
4107 if (bitpos >= GET_MODE_BITSIZE (opmode))
4108 return NULL;
4110 if ((bitpos % GET_MODE_BITSIZE (mode)) == 0)
4111 return simplify_gen_subreg (mode, op0, opmode,
4112 bitpos / BITS_PER_UNIT);
4115 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0))
4116 && TYPE_UNSIGNED (TREE_TYPE (exp))
4117 ? SIGN_EXTRACT
4118 : ZERO_EXTRACT, mode,
4119 GET_MODE (op0) != VOIDmode
4120 ? GET_MODE (op0)
4121 : TYPE_MODE (TREE_TYPE (tem)),
4122 op0, GEN_INT (bitsize), GEN_INT (bitpos));
4125 case ABS_EXPR:
4126 return simplify_gen_unary (ABS, mode, op0, mode);
4128 case NEGATE_EXPR:
4129 return simplify_gen_unary (NEG, mode, op0, mode);
4131 case BIT_NOT_EXPR:
4132 return simplify_gen_unary (NOT, mode, op0, mode);
4134 case FLOAT_EXPR:
4135 return simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4136 0)))
4137 ? UNSIGNED_FLOAT : FLOAT, mode, op0,
4138 inner_mode);
4140 case FIX_TRUNC_EXPR:
4141 return simplify_gen_unary (unsignedp ? UNSIGNED_FIX : FIX, mode, op0,
4142 inner_mode);
4144 case POINTER_PLUS_EXPR:
4145 /* For the rare target where pointers are not the same size as
4146 size_t, we need to check for mis-matched modes and correct
4147 the addend. */
4148 if (op0 && op1
4149 && GET_MODE (op0) != VOIDmode && GET_MODE (op1) != VOIDmode
4150 && GET_MODE (op0) != GET_MODE (op1))
4152 if (GET_MODE_BITSIZE (GET_MODE (op0)) < GET_MODE_BITSIZE (GET_MODE (op1))
4153 /* If OP0 is a partial mode, then we must truncate, even if it has
4154 the same bitsize as OP1 as GCC's representation of partial modes
4155 is opaque. */
4156 || (GET_MODE_CLASS (GET_MODE (op0)) == MODE_PARTIAL_INT
4157 && GET_MODE_BITSIZE (GET_MODE (op0)) == GET_MODE_BITSIZE (GET_MODE (op1))))
4158 op1 = simplify_gen_unary (TRUNCATE, GET_MODE (op0), op1,
4159 GET_MODE (op1));
4160 else
4161 /* We always sign-extend, regardless of the signedness of
4162 the operand, because the operand is always unsigned
4163 here even if the original C expression is signed. */
4164 op1 = simplify_gen_unary (SIGN_EXTEND, GET_MODE (op0), op1,
4165 GET_MODE (op1));
4167 /* Fall through. */
4168 case PLUS_EXPR:
4169 return simplify_gen_binary (PLUS, mode, op0, op1);
4171 case MINUS_EXPR:
4172 return simplify_gen_binary (MINUS, mode, op0, op1);
4174 case MULT_EXPR:
4175 return simplify_gen_binary (MULT, mode, op0, op1);
4177 case RDIV_EXPR:
4178 case TRUNC_DIV_EXPR:
4179 case EXACT_DIV_EXPR:
4180 if (unsignedp)
4181 return simplify_gen_binary (UDIV, mode, op0, op1);
4182 else
4183 return simplify_gen_binary (DIV, mode, op0, op1);
4185 case TRUNC_MOD_EXPR:
4186 return simplify_gen_binary (unsignedp ? UMOD : MOD, mode, op0, op1);
4188 case FLOOR_DIV_EXPR:
4189 if (unsignedp)
4190 return simplify_gen_binary (UDIV, mode, op0, op1);
4191 else
4193 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4194 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4195 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4196 return simplify_gen_binary (PLUS, mode, div, adj);
4199 case FLOOR_MOD_EXPR:
4200 if (unsignedp)
4201 return simplify_gen_binary (UMOD, mode, op0, op1);
4202 else
4204 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4205 rtx adj = floor_sdiv_adjust (mode, mod, op1);
4206 adj = simplify_gen_unary (NEG, mode,
4207 simplify_gen_binary (MULT, mode, adj, op1),
4208 mode);
4209 return simplify_gen_binary (PLUS, mode, mod, adj);
4212 case CEIL_DIV_EXPR:
4213 if (unsignedp)
4215 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4216 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4217 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4218 return simplify_gen_binary (PLUS, mode, div, adj);
4220 else
4222 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4223 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4224 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4225 return simplify_gen_binary (PLUS, mode, div, adj);
4228 case CEIL_MOD_EXPR:
4229 if (unsignedp)
4231 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4232 rtx adj = ceil_udiv_adjust (mode, mod, op1);
4233 adj = simplify_gen_unary (NEG, mode,
4234 simplify_gen_binary (MULT, mode, adj, op1),
4235 mode);
4236 return simplify_gen_binary (PLUS, mode, mod, adj);
4238 else
4240 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4241 rtx adj = ceil_sdiv_adjust (mode, mod, op1);
4242 adj = simplify_gen_unary (NEG, mode,
4243 simplify_gen_binary (MULT, mode, adj, op1),
4244 mode);
4245 return simplify_gen_binary (PLUS, mode, mod, adj);
4248 case ROUND_DIV_EXPR:
4249 if (unsignedp)
4251 rtx div = simplify_gen_binary (UDIV, mode, op0, op1);
4252 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4253 rtx adj = round_udiv_adjust (mode, mod, op1);
4254 return simplify_gen_binary (PLUS, mode, div, adj);
4256 else
4258 rtx div = simplify_gen_binary (DIV, mode, op0, op1);
4259 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4260 rtx adj = round_sdiv_adjust (mode, mod, op1);
4261 return simplify_gen_binary (PLUS, mode, div, adj);
4264 case ROUND_MOD_EXPR:
4265 if (unsignedp)
4267 rtx mod = simplify_gen_binary (UMOD, mode, op0, op1);
4268 rtx adj = round_udiv_adjust (mode, mod, op1);
4269 adj = simplify_gen_unary (NEG, mode,
4270 simplify_gen_binary (MULT, mode, adj, op1),
4271 mode);
4272 return simplify_gen_binary (PLUS, mode, mod, adj);
4274 else
4276 rtx mod = simplify_gen_binary (MOD, mode, op0, op1);
4277 rtx adj = round_sdiv_adjust (mode, mod, op1);
4278 adj = simplify_gen_unary (NEG, mode,
4279 simplify_gen_binary (MULT, mode, adj, op1),
4280 mode);
4281 return simplify_gen_binary (PLUS, mode, mod, adj);
4284 case LSHIFT_EXPR:
4285 return simplify_gen_binary (ASHIFT, mode, op0, op1);
4287 case RSHIFT_EXPR:
4288 if (unsignedp)
4289 return simplify_gen_binary (LSHIFTRT, mode, op0, op1);
4290 else
4291 return simplify_gen_binary (ASHIFTRT, mode, op0, op1);
4293 case LROTATE_EXPR:
4294 return simplify_gen_binary (ROTATE, mode, op0, op1);
4296 case RROTATE_EXPR:
4297 return simplify_gen_binary (ROTATERT, mode, op0, op1);
4299 case MIN_EXPR:
4300 return simplify_gen_binary (unsignedp ? UMIN : SMIN, mode, op0, op1);
4302 case MAX_EXPR:
4303 return simplify_gen_binary (unsignedp ? UMAX : SMAX, mode, op0, op1);
4305 case BIT_AND_EXPR:
4306 case TRUTH_AND_EXPR:
4307 return simplify_gen_binary (AND, mode, op0, op1);
4309 case BIT_IOR_EXPR:
4310 case TRUTH_OR_EXPR:
4311 return simplify_gen_binary (IOR, mode, op0, op1);
4313 case BIT_XOR_EXPR:
4314 case TRUTH_XOR_EXPR:
4315 return simplify_gen_binary (XOR, mode, op0, op1);
4317 case TRUTH_ANDIF_EXPR:
4318 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, const0_rtx);
4320 case TRUTH_ORIF_EXPR:
4321 return gen_rtx_IF_THEN_ELSE (mode, op0, const_true_rtx, op1);
4323 case TRUTH_NOT_EXPR:
4324 return simplify_gen_relational (EQ, mode, inner_mode, op0, const0_rtx);
4326 case LT_EXPR:
4327 return simplify_gen_relational (unsignedp ? LTU : LT, mode, inner_mode,
4328 op0, op1);
4330 case LE_EXPR:
4331 return simplify_gen_relational (unsignedp ? LEU : LE, mode, inner_mode,
4332 op0, op1);
4334 case GT_EXPR:
4335 return simplify_gen_relational (unsignedp ? GTU : GT, mode, inner_mode,
4336 op0, op1);
4338 case GE_EXPR:
4339 return simplify_gen_relational (unsignedp ? GEU : GE, mode, inner_mode,
4340 op0, op1);
4342 case EQ_EXPR:
4343 return simplify_gen_relational (EQ, mode, inner_mode, op0, op1);
4345 case NE_EXPR:
4346 return simplify_gen_relational (NE, mode, inner_mode, op0, op1);
4348 case UNORDERED_EXPR:
4349 return simplify_gen_relational (UNORDERED, mode, inner_mode, op0, op1);
4351 case ORDERED_EXPR:
4352 return simplify_gen_relational (ORDERED, mode, inner_mode, op0, op1);
4354 case UNLT_EXPR:
4355 return simplify_gen_relational (UNLT, mode, inner_mode, op0, op1);
4357 case UNLE_EXPR:
4358 return simplify_gen_relational (UNLE, mode, inner_mode, op0, op1);
4360 case UNGT_EXPR:
4361 return simplify_gen_relational (UNGT, mode, inner_mode, op0, op1);
4363 case UNGE_EXPR:
4364 return simplify_gen_relational (UNGE, mode, inner_mode, op0, op1);
4366 case UNEQ_EXPR:
4367 return simplify_gen_relational (UNEQ, mode, inner_mode, op0, op1);
4369 case LTGT_EXPR:
4370 return simplify_gen_relational (LTGT, mode, inner_mode, op0, op1);
4372 case COND_EXPR:
4373 return gen_rtx_IF_THEN_ELSE (mode, op0, op1, op2);
4375 case COMPLEX_EXPR:
4376 gcc_assert (COMPLEX_MODE_P (mode));
4377 if (GET_MODE (op0) == VOIDmode)
4378 op0 = gen_rtx_CONST (GET_MODE_INNER (mode), op0);
4379 if (GET_MODE (op1) == VOIDmode)
4380 op1 = gen_rtx_CONST (GET_MODE_INNER (mode), op1);
4381 return gen_rtx_CONCAT (mode, op0, op1);
4383 case CONJ_EXPR:
4384 if (GET_CODE (op0) == CONCAT)
4385 return gen_rtx_CONCAT (mode, XEXP (op0, 0),
4386 simplify_gen_unary (NEG, GET_MODE_INNER (mode),
4387 XEXP (op0, 1),
4388 GET_MODE_INNER (mode)));
4389 else
4391 enum machine_mode imode = GET_MODE_INNER (mode);
4392 rtx re, im;
4394 if (MEM_P (op0))
4396 re = adjust_address_nv (op0, imode, 0);
4397 im = adjust_address_nv (op0, imode, GET_MODE_SIZE (imode));
4399 else
4401 enum machine_mode ifmode = int_mode_for_mode (mode);
4402 enum machine_mode ihmode = int_mode_for_mode (imode);
4403 rtx halfsize;
4404 if (ifmode == BLKmode || ihmode == BLKmode)
4405 return NULL;
4406 halfsize = GEN_INT (GET_MODE_BITSIZE (ihmode));
4407 re = op0;
4408 if (mode != ifmode)
4409 re = gen_rtx_SUBREG (ifmode, re, 0);
4410 re = gen_rtx_ZERO_EXTRACT (ihmode, re, halfsize, const0_rtx);
4411 if (imode != ihmode)
4412 re = gen_rtx_SUBREG (imode, re, 0);
4413 im = copy_rtx (op0);
4414 if (mode != ifmode)
4415 im = gen_rtx_SUBREG (ifmode, im, 0);
4416 im = gen_rtx_ZERO_EXTRACT (ihmode, im, halfsize, halfsize);
4417 if (imode != ihmode)
4418 im = gen_rtx_SUBREG (imode, im, 0);
4420 im = gen_rtx_NEG (imode, im);
4421 return gen_rtx_CONCAT (mode, re, im);
4424 case ADDR_EXPR:
4425 op0 = expand_debug_expr (TREE_OPERAND (exp, 0));
4426 if (!op0 || !MEM_P (op0))
4428 if ((TREE_CODE (TREE_OPERAND (exp, 0)) == VAR_DECL
4429 || TREE_CODE (TREE_OPERAND (exp, 0)) == PARM_DECL
4430 || TREE_CODE (TREE_OPERAND (exp, 0)) == RESULT_DECL)
4431 && (!TREE_ADDRESSABLE (TREE_OPERAND (exp, 0))
4432 || target_for_debug_bind (TREE_OPERAND (exp, 0))))
4433 return gen_rtx_DEBUG_IMPLICIT_PTR (mode, TREE_OPERAND (exp, 0));
4435 if (handled_component_p (TREE_OPERAND (exp, 0)))
4437 HOST_WIDE_INT bitoffset, bitsize, maxsize;
4438 tree decl
4439 = get_ref_base_and_extent (TREE_OPERAND (exp, 0),
4440 &bitoffset, &bitsize, &maxsize);
4441 if ((TREE_CODE (decl) == VAR_DECL
4442 || TREE_CODE (decl) == PARM_DECL
4443 || TREE_CODE (decl) == RESULT_DECL)
4444 && (!TREE_ADDRESSABLE (decl)
4445 || target_for_debug_bind (decl))
4446 && (bitoffset % BITS_PER_UNIT) == 0
4447 && bitsize > 0
4448 && bitsize == maxsize)
4450 rtx base = gen_rtx_DEBUG_IMPLICIT_PTR (mode, decl);
4451 return plus_constant (mode, base, bitoffset / BITS_PER_UNIT);
4455 if (TREE_CODE (TREE_OPERAND (exp, 0)) == MEM_REF
4456 && TREE_CODE (TREE_OPERAND (TREE_OPERAND (exp, 0), 0))
4457 == ADDR_EXPR)
4459 op0 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4460 0));
4461 if (op0 != NULL
4462 && (GET_CODE (op0) == DEBUG_IMPLICIT_PTR
4463 || (GET_CODE (op0) == PLUS
4464 && GET_CODE (XEXP (op0, 0)) == DEBUG_IMPLICIT_PTR
4465 && CONST_INT_P (XEXP (op0, 1)))))
4467 op1 = expand_debug_expr (TREE_OPERAND (TREE_OPERAND (exp, 0),
4468 1));
4469 if (!op1 || !CONST_INT_P (op1))
4470 return NULL;
4472 return plus_constant (mode, op0, INTVAL (op1));
4476 return NULL;
4479 as = TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp)));
4480 op0 = convert_debug_memory_address (mode, XEXP (op0, 0), as);
4482 return op0;
4484 case VECTOR_CST:
4486 unsigned i;
4488 op0 = gen_rtx_CONCATN
4489 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4491 for (i = 0; i < VECTOR_CST_NELTS (exp); ++i)
4493 op1 = expand_debug_expr (VECTOR_CST_ELT (exp, i));
4494 if (!op1)
4495 return NULL;
4496 XVECEXP (op0, 0, i) = op1;
4499 return op0;
4502 case CONSTRUCTOR:
4503 if (TREE_CLOBBER_P (exp))
4504 return NULL;
4505 else if (TREE_CODE (TREE_TYPE (exp)) == VECTOR_TYPE)
4507 unsigned i;
4508 tree val;
4510 op0 = gen_rtx_CONCATN
4511 (mode, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp))));
4513 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp), i, val)
4515 op1 = expand_debug_expr (val);
4516 if (!op1)
4517 return NULL;
4518 XVECEXP (op0, 0, i) = op1;
4521 if (i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)))
4523 op1 = expand_debug_expr
4524 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp))));
4526 if (!op1)
4527 return NULL;
4529 for (; i < TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp)); i++)
4530 XVECEXP (op0, 0, i) = op1;
4533 return op0;
4535 else
4536 goto flag_unsupported;
4538 case CALL_EXPR:
4539 /* ??? Maybe handle some builtins? */
4540 return NULL;
4542 case SSA_NAME:
4544 gimple g = get_gimple_for_ssa_name (exp);
4545 if (g)
4547 op0 = expand_debug_expr (gimple_assign_rhs_to_tree (g));
4548 if (!op0)
4549 return NULL;
4551 else
4553 int part = var_to_partition (SA.map, exp);
4555 if (part == NO_PARTITION)
4557 /* If this is a reference to an incoming value of parameter
4558 that is never used in the code or where the incoming
4559 value is never used in the code, use PARM_DECL's
4560 DECL_RTL if set. */
4561 if (SSA_NAME_IS_DEFAULT_DEF (exp)
4562 && TREE_CODE (SSA_NAME_VAR (exp)) == PARM_DECL)
4564 op0 = expand_debug_parm_decl (SSA_NAME_VAR (exp));
4565 if (op0)
4566 goto adjust_mode;
4567 op0 = expand_debug_expr (SSA_NAME_VAR (exp));
4568 if (op0)
4569 goto adjust_mode;
4571 return NULL;
4574 gcc_assert (part >= 0 && (unsigned)part < SA.map->num_partitions);
4576 op0 = copy_rtx (SA.partition_to_pseudo[part]);
4578 goto adjust_mode;
4581 case ERROR_MARK:
4582 return NULL;
4584 /* Vector stuff. For most of the codes we don't have rtl codes. */
4585 case REALIGN_LOAD_EXPR:
4586 case REDUC_MAX_EXPR:
4587 case REDUC_MIN_EXPR:
4588 case REDUC_PLUS_EXPR:
4589 case VEC_COND_EXPR:
4590 case VEC_LSHIFT_EXPR:
4591 case VEC_PACK_FIX_TRUNC_EXPR:
4592 case VEC_PACK_SAT_EXPR:
4593 case VEC_PACK_TRUNC_EXPR:
4594 case VEC_RSHIFT_EXPR:
4595 case VEC_UNPACK_FLOAT_HI_EXPR:
4596 case VEC_UNPACK_FLOAT_LO_EXPR:
4597 case VEC_UNPACK_HI_EXPR:
4598 case VEC_UNPACK_LO_EXPR:
4599 case VEC_WIDEN_MULT_HI_EXPR:
4600 case VEC_WIDEN_MULT_LO_EXPR:
4601 case VEC_WIDEN_MULT_EVEN_EXPR:
4602 case VEC_WIDEN_MULT_ODD_EXPR:
4603 case VEC_WIDEN_LSHIFT_HI_EXPR:
4604 case VEC_WIDEN_LSHIFT_LO_EXPR:
4605 case VEC_PERM_EXPR:
4606 return NULL;
4608 /* Misc codes. */
4609 case ADDR_SPACE_CONVERT_EXPR:
4610 case FIXED_CONVERT_EXPR:
4611 case OBJ_TYPE_REF:
4612 case WITH_SIZE_EXPR:
4613 return NULL;
4615 case DOT_PROD_EXPR:
4616 if (SCALAR_INT_MODE_P (GET_MODE (op0))
4617 && SCALAR_INT_MODE_P (mode))
4620 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4621 0)))
4622 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
4623 inner_mode);
4625 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4626 1)))
4627 ? ZERO_EXTEND : SIGN_EXTEND, mode, op1,
4628 inner_mode);
4629 op0 = simplify_gen_binary (MULT, mode, op0, op1);
4630 return simplify_gen_binary (PLUS, mode, op0, op2);
4632 return NULL;
4634 case WIDEN_MULT_EXPR:
4635 case WIDEN_MULT_PLUS_EXPR:
4636 case WIDEN_MULT_MINUS_EXPR:
4637 if (SCALAR_INT_MODE_P (GET_MODE (op0))
4638 && SCALAR_INT_MODE_P (mode))
4640 inner_mode = GET_MODE (op0);
4641 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 0))))
4642 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4643 else
4644 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4645 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp, 1))))
4646 op1 = simplify_gen_unary (ZERO_EXTEND, mode, op1, inner_mode);
4647 else
4648 op1 = simplify_gen_unary (SIGN_EXTEND, mode, op1, inner_mode);
4649 op0 = simplify_gen_binary (MULT, mode, op0, op1);
4650 if (TREE_CODE (exp) == WIDEN_MULT_EXPR)
4651 return op0;
4652 else if (TREE_CODE (exp) == WIDEN_MULT_PLUS_EXPR)
4653 return simplify_gen_binary (PLUS, mode, op0, op2);
4654 else
4655 return simplify_gen_binary (MINUS, mode, op2, op0);
4657 return NULL;
4659 case MULT_HIGHPART_EXPR:
4660 /* ??? Similar to the above. */
4661 return NULL;
4663 case WIDEN_SUM_EXPR:
4664 case WIDEN_LSHIFT_EXPR:
4665 if (SCALAR_INT_MODE_P (GET_MODE (op0))
4666 && SCALAR_INT_MODE_P (mode))
4669 = simplify_gen_unary (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp,
4670 0)))
4671 ? ZERO_EXTEND : SIGN_EXTEND, mode, op0,
4672 inner_mode);
4673 return simplify_gen_binary (TREE_CODE (exp) == WIDEN_LSHIFT_EXPR
4674 ? ASHIFT : PLUS, mode, op0, op1);
4676 return NULL;
4678 case FMA_EXPR:
4679 return simplify_gen_ternary (FMA, mode, inner_mode, op0, op1, op2);
4681 default:
4682 flag_unsupported:
4683 #ifdef ENABLE_CHECKING
4684 debug_tree (exp);
4685 gcc_unreachable ();
4686 #else
4687 return NULL;
4688 #endif
4692 /* Return an RTX equivalent to the source bind value of the tree expression
4693 EXP. */
4695 static rtx
4696 expand_debug_source_expr (tree exp)
4698 rtx op0 = NULL_RTX;
4699 enum machine_mode mode = VOIDmode, inner_mode;
4701 switch (TREE_CODE (exp))
4703 case PARM_DECL:
4705 mode = DECL_MODE (exp);
4706 op0 = expand_debug_parm_decl (exp);
4707 if (op0)
4708 break;
4709 /* See if this isn't an argument that has been completely
4710 optimized out. */
4711 if (!DECL_RTL_SET_P (exp)
4712 && !DECL_INCOMING_RTL (exp)
4713 && DECL_ABSTRACT_ORIGIN (current_function_decl))
4715 tree aexp = DECL_ORIGIN (exp);
4716 if (DECL_CONTEXT (aexp)
4717 == DECL_ABSTRACT_ORIGIN (current_function_decl))
4719 vec<tree, va_gc> **debug_args;
4720 unsigned int ix;
4721 tree ddecl;
4722 debug_args = decl_debug_args_lookup (current_function_decl);
4723 if (debug_args != NULL)
4725 for (ix = 0; vec_safe_iterate (*debug_args, ix, &ddecl);
4726 ix += 2)
4727 if (ddecl == aexp)
4728 return gen_rtx_DEBUG_PARAMETER_REF (mode, aexp);
4732 break;
4734 default:
4735 break;
4738 if (op0 == NULL_RTX)
4739 return NULL_RTX;
4741 inner_mode = GET_MODE (op0);
4742 if (mode == inner_mode)
4743 return op0;
4745 if (FLOAT_MODE_P (mode) && FLOAT_MODE_P (inner_mode))
4747 if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (inner_mode))
4748 op0 = simplify_gen_subreg (mode, op0, inner_mode, 0);
4749 else if (GET_MODE_BITSIZE (mode) < GET_MODE_BITSIZE (inner_mode))
4750 op0 = simplify_gen_unary (FLOAT_TRUNCATE, mode, op0, inner_mode);
4751 else
4752 op0 = simplify_gen_unary (FLOAT_EXTEND, mode, op0, inner_mode);
4754 else if (FLOAT_MODE_P (mode))
4755 gcc_unreachable ();
4756 else if (FLOAT_MODE_P (inner_mode))
4758 if (TYPE_UNSIGNED (TREE_TYPE (exp)))
4759 op0 = simplify_gen_unary (UNSIGNED_FIX, mode, op0, inner_mode);
4760 else
4761 op0 = simplify_gen_unary (FIX, mode, op0, inner_mode);
4763 else if (CONSTANT_P (op0)
4764 || GET_MODE_BITSIZE (mode) <= GET_MODE_BITSIZE (inner_mode))
4765 op0 = simplify_gen_subreg (mode, op0, inner_mode,
4766 subreg_lowpart_offset (mode, inner_mode));
4767 else if (TYPE_UNSIGNED (TREE_TYPE (exp)))
4768 op0 = simplify_gen_unary (ZERO_EXTEND, mode, op0, inner_mode);
4769 else
4770 op0 = simplify_gen_unary (SIGN_EXTEND, mode, op0, inner_mode);
4772 return op0;
4775 /* Ensure INSN_VAR_LOCATION_LOC (insn) doesn't have unbound complexity.
4776 Allow 4 levels of rtl nesting for most rtl codes, and if we see anything
4777 deeper than that, create DEBUG_EXPRs and emit DEBUG_INSNs before INSN. */
4779 static void
4780 avoid_complex_debug_insns (rtx_insn *insn, rtx *exp_p, int depth)
4782 rtx exp = *exp_p;
4784 if (exp == NULL_RTX)
4785 return;
4787 if ((OBJECT_P (exp) && !MEM_P (exp)) || GET_CODE (exp) == CLOBBER)
4788 return;
4790 if (depth == 4)
4792 /* Create DEBUG_EXPR (and DEBUG_EXPR_DECL). */
4793 rtx dval = make_debug_expr_from_rtl (exp);
4795 /* Emit a debug bind insn before INSN. */
4796 rtx bind = gen_rtx_VAR_LOCATION (GET_MODE (exp),
4797 DEBUG_EXPR_TREE_DECL (dval), exp,
4798 VAR_INIT_STATUS_INITIALIZED);
4800 emit_debug_insn_before (bind, insn);
4801 *exp_p = dval;
4802 return;
4805 const char *format_ptr = GET_RTX_FORMAT (GET_CODE (exp));
4806 int i, j;
4807 for (i = 0; i < GET_RTX_LENGTH (GET_CODE (exp)); i++)
4808 switch (*format_ptr++)
4810 case 'e':
4811 avoid_complex_debug_insns (insn, &XEXP (exp, i), depth + 1);
4812 break;
4814 case 'E':
4815 case 'V':
4816 for (j = 0; j < XVECLEN (exp, i); j++)
4817 avoid_complex_debug_insns (insn, &XVECEXP (exp, i, j), depth + 1);
4818 break;
4820 default:
4821 break;
4825 /* Expand the _LOCs in debug insns. We run this after expanding all
4826 regular insns, so that any variables referenced in the function
4827 will have their DECL_RTLs set. */
4829 static void
4830 expand_debug_locations (void)
4832 rtx_insn *insn;
4833 rtx_insn *last = get_last_insn ();
4834 int save_strict_alias = flag_strict_aliasing;
4836 /* New alias sets while setting up memory attributes cause
4837 -fcompare-debug failures, even though it doesn't bring about any
4838 codegen changes. */
4839 flag_strict_aliasing = 0;
4841 for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
4842 if (DEBUG_INSN_P (insn))
4844 tree value = (tree)INSN_VAR_LOCATION_LOC (insn);
4845 rtx val;
4846 rtx_insn *prev_insn, *insn2;
4847 enum machine_mode mode;
4849 if (value == NULL_TREE)
4850 val = NULL_RTX;
4851 else
4853 if (INSN_VAR_LOCATION_STATUS (insn)
4854 == VAR_INIT_STATUS_UNINITIALIZED)
4855 val = expand_debug_source_expr (value);
4856 else
4857 val = expand_debug_expr (value);
4858 gcc_assert (last == get_last_insn ());
4861 if (!val)
4862 val = gen_rtx_UNKNOWN_VAR_LOC ();
4863 else
4865 mode = GET_MODE (INSN_VAR_LOCATION (insn));
4867 gcc_assert (mode == GET_MODE (val)
4868 || (GET_MODE (val) == VOIDmode
4869 && (CONST_SCALAR_INT_P (val)
4870 || GET_CODE (val) == CONST_FIXED
4871 || GET_CODE (val) == LABEL_REF)));
4874 INSN_VAR_LOCATION_LOC (insn) = val;
4875 prev_insn = PREV_INSN (insn);
4876 for (insn2 = insn; insn2 != prev_insn; insn2 = PREV_INSN (insn2))
4877 avoid_complex_debug_insns (insn2, &INSN_VAR_LOCATION_LOC (insn2), 0);
4880 flag_strict_aliasing = save_strict_alias;
4883 /* Expand basic block BB from GIMPLE trees to RTL. */
4885 static basic_block
4886 expand_gimple_basic_block (basic_block bb, bool disable_tail_calls)
4888 gimple_stmt_iterator gsi;
4889 gimple_seq stmts;
4890 gimple stmt = NULL;
4891 rtx_note *note;
4892 rtx_insn *last;
4893 edge e;
4894 edge_iterator ei;
4896 if (dump_file)
4897 fprintf (dump_file, "\n;; Generating RTL for gimple basic block %d\n",
4898 bb->index);
4900 /* Note that since we are now transitioning from GIMPLE to RTL, we
4901 cannot use the gsi_*_bb() routines because they expect the basic
4902 block to be in GIMPLE, instead of RTL. Therefore, we need to
4903 access the BB sequence directly. */
4904 stmts = bb_seq (bb);
4905 bb->il.gimple.seq = NULL;
4906 bb->il.gimple.phi_nodes = NULL;
4907 rtl_profile_for_bb (bb);
4908 init_rtl_bb_info (bb);
4909 bb->flags |= BB_RTL;
4911 /* Remove the RETURN_EXPR if we may fall though to the exit
4912 instead. */
4913 gsi = gsi_last (stmts);
4914 if (!gsi_end_p (gsi)
4915 && gimple_code (gsi_stmt (gsi)) == GIMPLE_RETURN)
4917 gimple ret_stmt = gsi_stmt (gsi);
4919 gcc_assert (single_succ_p (bb));
4920 gcc_assert (single_succ (bb) == EXIT_BLOCK_PTR_FOR_FN (cfun));
4922 if (bb->next_bb == EXIT_BLOCK_PTR_FOR_FN (cfun)
4923 && !gimple_return_retval (ret_stmt))
4925 gsi_remove (&gsi, false);
4926 single_succ_edge (bb)->flags |= EDGE_FALLTHRU;
4930 gsi = gsi_start (stmts);
4931 if (!gsi_end_p (gsi))
4933 stmt = gsi_stmt (gsi);
4934 if (gimple_code (stmt) != GIMPLE_LABEL)
4935 stmt = NULL;
4938 rtx_code_label **elt = lab_rtx_for_bb->get (bb);
4940 if (stmt || elt)
4942 last = get_last_insn ();
4944 if (stmt)
4946 expand_gimple_stmt (stmt);
4947 gsi_next (&gsi);
4950 if (elt)
4951 emit_label (*elt);
4953 /* Java emits line number notes in the top of labels.
4954 ??? Make this go away once line number notes are obsoleted. */
4955 BB_HEAD (bb) = NEXT_INSN (last);
4956 if (NOTE_P (BB_HEAD (bb)))
4957 BB_HEAD (bb) = NEXT_INSN (BB_HEAD (bb));
4958 note = emit_note_after (NOTE_INSN_BASIC_BLOCK, BB_HEAD (bb));
4960 maybe_dump_rtl_for_gimple_stmt (stmt, last);
4962 else
4963 BB_HEAD (bb) = note = emit_note (NOTE_INSN_BASIC_BLOCK);
4965 NOTE_BASIC_BLOCK (note) = bb;
4967 for (; !gsi_end_p (gsi); gsi_next (&gsi))
4969 basic_block new_bb;
4971 stmt = gsi_stmt (gsi);
4973 /* If this statement is a non-debug one, and we generate debug
4974 insns, then this one might be the last real use of a TERed
4975 SSA_NAME, but where there are still some debug uses further
4976 down. Expanding the current SSA name in such further debug
4977 uses by their RHS might lead to wrong debug info, as coalescing
4978 might make the operands of such RHS be placed into the same
4979 pseudo as something else. Like so:
4980 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
4981 use(a_1);
4982 a_2 = ...
4983 #DEBUG ... => a_1
4984 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
4985 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
4986 the write to a_2 would actually have clobbered the place which
4987 formerly held a_0.
4989 So, instead of that, we recognize the situation, and generate
4990 debug temporaries at the last real use of TERed SSA names:
4991 a_1 = a_0 + 1;
4992 #DEBUG #D1 => a_1
4993 use(a_1);
4994 a_2 = ...
4995 #DEBUG ... => #D1
4997 if (MAY_HAVE_DEBUG_INSNS
4998 && SA.values
4999 && !is_gimple_debug (stmt))
5001 ssa_op_iter iter;
5002 tree op;
5003 gimple def;
5005 location_t sloc = curr_insn_location ();
5007 /* Look for SSA names that have their last use here (TERed
5008 names always have only one real use). */
5009 FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
5010 if ((def = get_gimple_for_ssa_name (op)))
5012 imm_use_iterator imm_iter;
5013 use_operand_p use_p;
5014 bool have_debug_uses = false;
5016 FOR_EACH_IMM_USE_FAST (use_p, imm_iter, op)
5018 if (gimple_debug_bind_p (USE_STMT (use_p)))
5020 have_debug_uses = true;
5021 break;
5025 if (have_debug_uses)
5027 /* OP is a TERed SSA name, with DEF it's defining
5028 statement, and where OP is used in further debug
5029 instructions. Generate a debug temporary, and
5030 replace all uses of OP in debug insns with that
5031 temporary. */
5032 gimple debugstmt;
5033 tree value = gimple_assign_rhs_to_tree (def);
5034 tree vexpr = make_node (DEBUG_EXPR_DECL);
5035 rtx val;
5036 enum machine_mode mode;
5038 set_curr_insn_location (gimple_location (def));
5040 DECL_ARTIFICIAL (vexpr) = 1;
5041 TREE_TYPE (vexpr) = TREE_TYPE (value);
5042 if (DECL_P (value))
5043 mode = DECL_MODE (value);
5044 else
5045 mode = TYPE_MODE (TREE_TYPE (value));
5046 DECL_MODE (vexpr) = mode;
5048 val = gen_rtx_VAR_LOCATION
5049 (mode, vexpr, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5051 emit_debug_insn (val);
5053 FOR_EACH_IMM_USE_STMT (debugstmt, imm_iter, op)
5055 if (!gimple_debug_bind_p (debugstmt))
5056 continue;
5058 FOR_EACH_IMM_USE_ON_STMT (use_p, imm_iter)
5059 SET_USE (use_p, vexpr);
5061 update_stmt (debugstmt);
5065 set_curr_insn_location (sloc);
5068 currently_expanding_gimple_stmt = stmt;
5070 /* Expand this statement, then evaluate the resulting RTL and
5071 fixup the CFG accordingly. */
5072 if (gimple_code (stmt) == GIMPLE_COND)
5074 new_bb = expand_gimple_cond (bb, stmt);
5075 if (new_bb)
5076 return new_bb;
5078 else if (gimple_debug_bind_p (stmt))
5080 location_t sloc = curr_insn_location ();
5081 gimple_stmt_iterator nsi = gsi;
5083 for (;;)
5085 tree var = gimple_debug_bind_get_var (stmt);
5086 tree value;
5087 rtx val;
5088 enum machine_mode mode;
5090 if (TREE_CODE (var) != DEBUG_EXPR_DECL
5091 && TREE_CODE (var) != LABEL_DECL
5092 && !target_for_debug_bind (var))
5093 goto delink_debug_stmt;
5095 if (gimple_debug_bind_has_value_p (stmt))
5096 value = gimple_debug_bind_get_value (stmt);
5097 else
5098 value = NULL_TREE;
5100 last = get_last_insn ();
5102 set_curr_insn_location (gimple_location (stmt));
5104 if (DECL_P (var))
5105 mode = DECL_MODE (var);
5106 else
5107 mode = TYPE_MODE (TREE_TYPE (var));
5109 val = gen_rtx_VAR_LOCATION
5110 (mode, var, (rtx)value, VAR_INIT_STATUS_INITIALIZED);
5112 emit_debug_insn (val);
5114 if (dump_file && (dump_flags & TDF_DETAILS))
5116 /* We can't dump the insn with a TREE where an RTX
5117 is expected. */
5118 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5119 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5120 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5123 delink_debug_stmt:
5124 /* In order not to generate too many debug temporaries,
5125 we delink all uses of debug statements we already expanded.
5126 Therefore debug statements between definition and real
5127 use of TERed SSA names will continue to use the SSA name,
5128 and not be replaced with debug temps. */
5129 delink_stmt_imm_use (stmt);
5131 gsi = nsi;
5132 gsi_next (&nsi);
5133 if (gsi_end_p (nsi))
5134 break;
5135 stmt = gsi_stmt (nsi);
5136 if (!gimple_debug_bind_p (stmt))
5137 break;
5140 set_curr_insn_location (sloc);
5142 else if (gimple_debug_source_bind_p (stmt))
5144 location_t sloc = curr_insn_location ();
5145 tree var = gimple_debug_source_bind_get_var (stmt);
5146 tree value = gimple_debug_source_bind_get_value (stmt);
5147 rtx val;
5148 enum machine_mode mode;
5150 last = get_last_insn ();
5152 set_curr_insn_location (gimple_location (stmt));
5154 mode = DECL_MODE (var);
5156 val = gen_rtx_VAR_LOCATION (mode, var, (rtx)value,
5157 VAR_INIT_STATUS_UNINITIALIZED);
5159 emit_debug_insn (val);
5161 if (dump_file && (dump_flags & TDF_DETAILS))
5163 /* We can't dump the insn with a TREE where an RTX
5164 is expected. */
5165 PAT_VAR_LOCATION_LOC (val) = const0_rtx;
5166 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5167 PAT_VAR_LOCATION_LOC (val) = (rtx)value;
5170 set_curr_insn_location (sloc);
5172 else
5174 if (is_gimple_call (stmt)
5175 && gimple_call_tail_p (stmt)
5176 && disable_tail_calls)
5177 gimple_call_set_tail (stmt, false);
5179 if (is_gimple_call (stmt) && gimple_call_tail_p (stmt))
5181 bool can_fallthru;
5182 new_bb = expand_gimple_tailcall (bb, stmt, &can_fallthru);
5183 if (new_bb)
5185 if (can_fallthru)
5186 bb = new_bb;
5187 else
5188 return new_bb;
5191 else
5193 def_operand_p def_p;
5194 def_p = SINGLE_SSA_DEF_OPERAND (stmt, SSA_OP_DEF);
5196 if (def_p != NULL)
5198 /* Ignore this stmt if it is in the list of
5199 replaceable expressions. */
5200 if (SA.values
5201 && bitmap_bit_p (SA.values,
5202 SSA_NAME_VERSION (DEF_FROM_PTR (def_p))))
5203 continue;
5205 last = expand_gimple_stmt (stmt);
5206 maybe_dump_rtl_for_gimple_stmt (stmt, last);
5211 currently_expanding_gimple_stmt = NULL;
5213 /* Expand implicit goto and convert goto_locus. */
5214 FOR_EACH_EDGE (e, ei, bb->succs)
5216 if (e->goto_locus != UNKNOWN_LOCATION)
5217 set_curr_insn_location (e->goto_locus);
5218 if ((e->flags & EDGE_FALLTHRU) && e->dest != bb->next_bb)
5220 emit_jump (label_rtx_for_bb (e->dest));
5221 e->flags &= ~EDGE_FALLTHRU;
5225 /* Expanded RTL can create a jump in the last instruction of block.
5226 This later might be assumed to be a jump to successor and break edge insertion.
5227 We need to insert dummy move to prevent this. PR41440. */
5228 if (single_succ_p (bb)
5229 && (single_succ_edge (bb)->flags & EDGE_FALLTHRU)
5230 && (last = get_last_insn ())
5231 && JUMP_P (last))
5233 rtx dummy = gen_reg_rtx (SImode);
5234 emit_insn_after_noloc (gen_move_insn (dummy, dummy), last, NULL);
5237 do_pending_stack_adjust ();
5239 /* Find the block tail. The last insn in the block is the insn
5240 before a barrier and/or table jump insn. */
5241 last = get_last_insn ();
5242 if (BARRIER_P (last))
5243 last = PREV_INSN (last);
5244 if (JUMP_TABLE_DATA_P (last))
5245 last = PREV_INSN (PREV_INSN (last));
5246 BB_END (bb) = last;
5248 update_bb_for_insn (bb);
5250 return bb;
5254 /* Create a basic block for initialization code. */
5256 static basic_block
5257 construct_init_block (void)
5259 basic_block init_block, first_block;
5260 edge e = NULL;
5261 int flags;
5263 /* Multiple entry points not supported yet. */
5264 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR_FOR_FN (cfun)->succs) == 1);
5265 init_rtl_bb_info (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5266 init_rtl_bb_info (EXIT_BLOCK_PTR_FOR_FN (cfun));
5267 ENTRY_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5268 EXIT_BLOCK_PTR_FOR_FN (cfun)->flags |= BB_RTL;
5270 e = EDGE_SUCC (ENTRY_BLOCK_PTR_FOR_FN (cfun), 0);
5272 /* When entry edge points to first basic block, we don't need jump,
5273 otherwise we have to jump into proper target. */
5274 if (e && e->dest != ENTRY_BLOCK_PTR_FOR_FN (cfun)->next_bb)
5276 tree label = gimple_block_label (e->dest);
5278 emit_jump (label_rtx (label));
5279 flags = 0;
5281 else
5282 flags = EDGE_FALLTHRU;
5284 init_block = create_basic_block (NEXT_INSN (get_insns ()),
5285 get_last_insn (),
5286 ENTRY_BLOCK_PTR_FOR_FN (cfun));
5287 init_block->frequency = ENTRY_BLOCK_PTR_FOR_FN (cfun)->frequency;
5288 init_block->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5289 add_bb_to_loop (init_block, ENTRY_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5290 if (e)
5292 first_block = e->dest;
5293 redirect_edge_succ (e, init_block);
5294 e = make_edge (init_block, first_block, flags);
5296 else
5297 e = make_edge (init_block, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_FALLTHRU);
5298 e->probability = REG_BR_PROB_BASE;
5299 e->count = ENTRY_BLOCK_PTR_FOR_FN (cfun)->count;
5301 update_bb_for_insn (init_block);
5302 return init_block;
5305 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
5306 found in the block tree. */
5308 static void
5309 set_block_levels (tree block, int level)
5311 while (block)
5313 BLOCK_NUMBER (block) = level;
5314 set_block_levels (BLOCK_SUBBLOCKS (block), level + 1);
5315 block = BLOCK_CHAIN (block);
5319 /* Create a block containing landing pads and similar stuff. */
5321 static void
5322 construct_exit_block (void)
5324 rtx_insn *head = get_last_insn ();
5325 rtx_insn *end;
5326 basic_block exit_block;
5327 edge e, e2;
5328 unsigned ix;
5329 edge_iterator ei;
5330 basic_block prev_bb = EXIT_BLOCK_PTR_FOR_FN (cfun)->prev_bb;
5331 rtx_insn *orig_end = BB_END (prev_bb);
5333 rtl_profile_for_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5335 /* Make sure the locus is set to the end of the function, so that
5336 epilogue line numbers and warnings are set properly. */
5337 if (LOCATION_LOCUS (cfun->function_end_locus) != UNKNOWN_LOCATION)
5338 input_location = cfun->function_end_locus;
5340 /* Generate rtl for function exit. */
5341 expand_function_end ();
5343 end = get_last_insn ();
5344 if (head == end)
5345 return;
5346 /* While emitting the function end we could move end of the last basic
5347 block. */
5348 BB_END (prev_bb) = orig_end;
5349 while (NEXT_INSN (head) && NOTE_P (NEXT_INSN (head)))
5350 head = NEXT_INSN (head);
5351 /* But make sure exit_block starts with RETURN_LABEL, otherwise the
5352 bb frequency counting will be confused. Any instructions before that
5353 label are emitted for the case where PREV_BB falls through into the
5354 exit block, so append those instructions to prev_bb in that case. */
5355 if (NEXT_INSN (head) != return_label)
5357 while (NEXT_INSN (head) != return_label)
5359 if (!NOTE_P (NEXT_INSN (head)))
5360 BB_END (prev_bb) = NEXT_INSN (head);
5361 head = NEXT_INSN (head);
5364 exit_block = create_basic_block (NEXT_INSN (head), end, prev_bb);
5365 exit_block->frequency = EXIT_BLOCK_PTR_FOR_FN (cfun)->frequency;
5366 exit_block->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5367 add_bb_to_loop (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun)->loop_father);
5369 ix = 0;
5370 while (ix < EDGE_COUNT (EXIT_BLOCK_PTR_FOR_FN (cfun)->preds))
5372 e = EDGE_PRED (EXIT_BLOCK_PTR_FOR_FN (cfun), ix);
5373 if (!(e->flags & EDGE_ABNORMAL))
5374 redirect_edge_succ (e, exit_block);
5375 else
5376 ix++;
5379 e = make_edge (exit_block, EXIT_BLOCK_PTR_FOR_FN (cfun), EDGE_FALLTHRU);
5380 e->probability = REG_BR_PROB_BASE;
5381 e->count = EXIT_BLOCK_PTR_FOR_FN (cfun)->count;
5382 FOR_EACH_EDGE (e2, ei, EXIT_BLOCK_PTR_FOR_FN (cfun)->preds)
5383 if (e2 != e)
5385 e->count -= e2->count;
5386 exit_block->count -= e2->count;
5387 exit_block->frequency -= EDGE_FREQUENCY (e2);
5389 if (e->count < 0)
5390 e->count = 0;
5391 if (exit_block->count < 0)
5392 exit_block->count = 0;
5393 if (exit_block->frequency < 0)
5394 exit_block->frequency = 0;
5395 update_bb_for_insn (exit_block);
5398 /* Helper function for discover_nonconstant_array_refs.
5399 Look for ARRAY_REF nodes with non-constant indexes and mark them
5400 addressable. */
5402 static tree
5403 discover_nonconstant_array_refs_r (tree * tp, int *walk_subtrees,
5404 void *data ATTRIBUTE_UNUSED)
5406 tree t = *tp;
5408 if (IS_TYPE_OR_DECL_P (t))
5409 *walk_subtrees = 0;
5410 else if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5412 while (((TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5413 && is_gimple_min_invariant (TREE_OPERAND (t, 1))
5414 && (!TREE_OPERAND (t, 2)
5415 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5416 || (TREE_CODE (t) == COMPONENT_REF
5417 && (!TREE_OPERAND (t,2)
5418 || is_gimple_min_invariant (TREE_OPERAND (t, 2))))
5419 || TREE_CODE (t) == BIT_FIELD_REF
5420 || TREE_CODE (t) == REALPART_EXPR
5421 || TREE_CODE (t) == IMAGPART_EXPR
5422 || TREE_CODE (t) == VIEW_CONVERT_EXPR
5423 || CONVERT_EXPR_P (t))
5424 t = TREE_OPERAND (t, 0);
5426 if (TREE_CODE (t) == ARRAY_REF || TREE_CODE (t) == ARRAY_RANGE_REF)
5428 t = get_base_address (t);
5429 if (t && DECL_P (t)
5430 && DECL_MODE (t) != BLKmode)
5431 TREE_ADDRESSABLE (t) = 1;
5434 *walk_subtrees = 0;
5437 return NULL_TREE;
5440 /* RTL expansion is not able to compile array references with variable
5441 offsets for arrays stored in single register. Discover such
5442 expressions and mark variables as addressable to avoid this
5443 scenario. */
5445 static void
5446 discover_nonconstant_array_refs (void)
5448 basic_block bb;
5449 gimple_stmt_iterator gsi;
5451 FOR_EACH_BB_FN (bb, cfun)
5452 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5454 gimple stmt = gsi_stmt (gsi);
5455 if (!is_gimple_debug (stmt))
5456 walk_gimple_op (stmt, discover_nonconstant_array_refs_r, NULL);
5460 /* This function sets crtl->args.internal_arg_pointer to a virtual
5461 register if DRAP is needed. Local register allocator will replace
5462 virtual_incoming_args_rtx with the virtual register. */
5464 static void
5465 expand_stack_alignment (void)
5467 rtx drap_rtx;
5468 unsigned int preferred_stack_boundary;
5470 if (! SUPPORTS_STACK_ALIGNMENT)
5471 return;
5473 if (cfun->calls_alloca
5474 || cfun->has_nonlocal_label
5475 || crtl->has_nonlocal_goto)
5476 crtl->need_drap = true;
5478 /* Call update_stack_boundary here again to update incoming stack
5479 boundary. It may set incoming stack alignment to a different
5480 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
5481 use the minimum incoming stack alignment to check if it is OK
5482 to perform sibcall optimization since sibcall optimization will
5483 only align the outgoing stack to incoming stack boundary. */
5484 if (targetm.calls.update_stack_boundary)
5485 targetm.calls.update_stack_boundary ();
5487 /* The incoming stack frame has to be aligned at least at
5488 parm_stack_boundary. */
5489 gcc_assert (crtl->parm_stack_boundary <= INCOMING_STACK_BOUNDARY);
5491 /* Update crtl->stack_alignment_estimated and use it later to align
5492 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
5493 exceptions since callgraph doesn't collect incoming stack alignment
5494 in this case. */
5495 if (cfun->can_throw_non_call_exceptions
5496 && PREFERRED_STACK_BOUNDARY > crtl->preferred_stack_boundary)
5497 preferred_stack_boundary = PREFERRED_STACK_BOUNDARY;
5498 else
5499 preferred_stack_boundary = crtl->preferred_stack_boundary;
5500 if (preferred_stack_boundary > crtl->stack_alignment_estimated)
5501 crtl->stack_alignment_estimated = preferred_stack_boundary;
5502 if (preferred_stack_boundary > crtl->stack_alignment_needed)
5503 crtl->stack_alignment_needed = preferred_stack_boundary;
5505 gcc_assert (crtl->stack_alignment_needed
5506 <= crtl->stack_alignment_estimated);
5508 crtl->stack_realign_needed
5509 = INCOMING_STACK_BOUNDARY < crtl->stack_alignment_estimated;
5510 crtl->stack_realign_tried = crtl->stack_realign_needed;
5512 crtl->stack_realign_processed = true;
5514 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
5515 alignment. */
5516 gcc_assert (targetm.calls.get_drap_rtx != NULL);
5517 drap_rtx = targetm.calls.get_drap_rtx ();
5519 /* stack_realign_drap and drap_rtx must match. */
5520 gcc_assert ((stack_realign_drap != 0) == (drap_rtx != NULL));
5522 /* Do nothing if NULL is returned, which means DRAP is not needed. */
5523 if (NULL != drap_rtx)
5525 crtl->args.internal_arg_pointer = drap_rtx;
5527 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
5528 needed. */
5529 fixup_tail_calls ();
5534 static void
5535 expand_main_function (void)
5537 #if (defined(INVOKE__main) \
5538 || (!defined(HAS_INIT_SECTION) \
5539 && !defined(INIT_SECTION_ASM_OP) \
5540 && !defined(INIT_ARRAY_SECTION_ASM_OP)))
5541 emit_library_call (init_one_libfunc (NAME__MAIN), LCT_NORMAL, VOIDmode, 0);
5542 #endif
5546 /* Expand code to initialize the stack_protect_guard. This is invoked at
5547 the beginning of a function to be protected. */
5549 #ifndef HAVE_stack_protect_set
5550 # define HAVE_stack_protect_set 0
5551 # define gen_stack_protect_set(x,y) (gcc_unreachable (), NULL_RTX)
5552 #endif
5554 static void
5555 stack_protect_prologue (void)
5557 tree guard_decl = targetm.stack_protect_guard ();
5558 rtx x, y;
5560 x = expand_normal (crtl->stack_protect_guard);
5561 y = expand_normal (guard_decl);
5563 /* Allow the target to copy from Y to X without leaking Y into a
5564 register. */
5565 if (HAVE_stack_protect_set)
5567 rtx insn = gen_stack_protect_set (x, y);
5568 if (insn)
5570 emit_insn (insn);
5571 return;
5575 /* Otherwise do a straight move. */
5576 emit_move_insn (x, y);
5579 /* Translate the intermediate representation contained in the CFG
5580 from GIMPLE trees to RTL.
5582 We do conversion per basic block and preserve/update the tree CFG.
5583 This implies we have to do some magic as the CFG can simultaneously
5584 consist of basic blocks containing RTL and GIMPLE trees. This can
5585 confuse the CFG hooks, so be careful to not manipulate CFG during
5586 the expansion. */
5588 namespace {
5590 const pass_data pass_data_expand =
5592 RTL_PASS, /* type */
5593 "expand", /* name */
5594 OPTGROUP_NONE, /* optinfo_flags */
5595 TV_EXPAND, /* tv_id */
5596 ( PROP_ssa | PROP_gimple_leh | PROP_cfg
5597 | PROP_gimple_lcx
5598 | PROP_gimple_lvec ), /* properties_required */
5599 PROP_rtl, /* properties_provided */
5600 ( PROP_ssa | PROP_trees ), /* properties_destroyed */
5601 0, /* todo_flags_start */
5602 0, /* todo_flags_finish */
5605 class pass_expand : public rtl_opt_pass
5607 public:
5608 pass_expand (gcc::context *ctxt)
5609 : rtl_opt_pass (pass_data_expand, ctxt)
5612 /* opt_pass methods: */
5613 virtual unsigned int execute (function *);
5615 }; // class pass_expand
5617 unsigned int
5618 pass_expand::execute (function *fun)
5620 basic_block bb, init_block;
5621 sbitmap blocks;
5622 edge_iterator ei;
5623 edge e;
5624 rtx_insn *var_seq, *var_ret_seq;
5625 unsigned i;
5627 timevar_push (TV_OUT_OF_SSA);
5628 rewrite_out_of_ssa (&SA);
5629 timevar_pop (TV_OUT_OF_SSA);
5630 SA.partition_to_pseudo = XCNEWVEC (rtx, SA.map->num_partitions);
5632 /* Make sure all values used by the optimization passes have sane
5633 defaults. */
5634 reg_renumber = 0;
5636 /* Some backends want to know that we are expanding to RTL. */
5637 currently_expanding_to_rtl = 1;
5638 /* Dominators are not kept up-to-date as we may create new basic-blocks. */
5639 free_dominance_info (CDI_DOMINATORS);
5641 rtl_profile_for_bb (ENTRY_BLOCK_PTR_FOR_FN (fun));
5643 insn_locations_init ();
5644 if (!DECL_IS_BUILTIN (current_function_decl))
5646 /* Eventually, all FEs should explicitly set function_start_locus. */
5647 if (LOCATION_LOCUS (fun->function_start_locus) == UNKNOWN_LOCATION)
5648 set_curr_insn_location
5649 (DECL_SOURCE_LOCATION (current_function_decl));
5650 else
5651 set_curr_insn_location (fun->function_start_locus);
5653 else
5654 set_curr_insn_location (UNKNOWN_LOCATION);
5655 prologue_location = curr_insn_location ();
5657 #ifdef INSN_SCHEDULING
5658 init_sched_attrs ();
5659 #endif
5661 /* Make sure first insn is a note even if we don't want linenums.
5662 This makes sure the first insn will never be deleted.
5663 Also, final expects a note to appear there. */
5664 emit_note (NOTE_INSN_DELETED);
5666 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
5667 discover_nonconstant_array_refs ();
5669 targetm.expand_to_rtl_hook ();
5670 crtl->stack_alignment_needed = STACK_BOUNDARY;
5671 crtl->max_used_stack_slot_alignment = STACK_BOUNDARY;
5672 crtl->stack_alignment_estimated = 0;
5673 crtl->preferred_stack_boundary = STACK_BOUNDARY;
5674 fun->cfg->max_jumptable_ents = 0;
5676 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
5677 of the function section at exapnsion time to predict distance of calls. */
5678 resolve_unique_section (current_function_decl, 0, flag_function_sections);
5680 /* Expand the variables recorded during gimple lowering. */
5681 timevar_push (TV_VAR_EXPAND);
5682 start_sequence ();
5684 var_ret_seq = expand_used_vars ();
5686 var_seq = get_insns ();
5687 end_sequence ();
5688 timevar_pop (TV_VAR_EXPAND);
5690 /* Honor stack protection warnings. */
5691 if (warn_stack_protect)
5693 if (fun->calls_alloca)
5694 warning (OPT_Wstack_protector,
5695 "stack protector not protecting local variables: "
5696 "variable length buffer");
5697 if (has_short_buffer && !crtl->stack_protect_guard)
5698 warning (OPT_Wstack_protector,
5699 "stack protector not protecting function: "
5700 "all local arrays are less than %d bytes long",
5701 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE));
5704 /* Set up parameters and prepare for return, for the function. */
5705 expand_function_start (current_function_decl);
5707 /* If we emitted any instructions for setting up the variables,
5708 emit them before the FUNCTION_START note. */
5709 if (var_seq)
5711 emit_insn_before (var_seq, parm_birth_insn);
5713 /* In expand_function_end we'll insert the alloca save/restore
5714 before parm_birth_insn. We've just insertted an alloca call.
5715 Adjust the pointer to match. */
5716 parm_birth_insn = var_seq;
5719 /* Now that we also have the parameter RTXs, copy them over to our
5720 partitions. */
5721 for (i = 0; i < SA.map->num_partitions; i++)
5723 tree var = SSA_NAME_VAR (partition_to_var (SA.map, i));
5725 if (TREE_CODE (var) != VAR_DECL
5726 && !SA.partition_to_pseudo[i])
5727 SA.partition_to_pseudo[i] = DECL_RTL_IF_SET (var);
5728 gcc_assert (SA.partition_to_pseudo[i]);
5730 /* If this decl was marked as living in multiple places, reset
5731 this now to NULL. */
5732 if (DECL_RTL_IF_SET (var) == pc_rtx)
5733 SET_DECL_RTL (var, NULL);
5735 /* Some RTL parts really want to look at DECL_RTL(x) when x
5736 was a decl marked in REG_ATTR or MEM_ATTR. We could use
5737 SET_DECL_RTL here making this available, but that would mean
5738 to select one of the potentially many RTLs for one DECL. Instead
5739 of doing that we simply reset the MEM_EXPR of the RTL in question,
5740 then nobody can get at it and hence nobody can call DECL_RTL on it. */
5741 if (!DECL_RTL_SET_P (var))
5743 if (MEM_P (SA.partition_to_pseudo[i]))
5744 set_mem_expr (SA.partition_to_pseudo[i], NULL);
5748 /* If we have a class containing differently aligned pointers
5749 we need to merge those into the corresponding RTL pointer
5750 alignment. */
5751 for (i = 1; i < num_ssa_names; i++)
5753 tree name = ssa_name (i);
5754 int part;
5755 rtx r;
5757 if (!name
5758 /* We might have generated new SSA names in
5759 update_alias_info_with_stack_vars. They will have a NULL
5760 defining statements, and won't be part of the partitioning,
5761 so ignore those. */
5762 || !SSA_NAME_DEF_STMT (name))
5763 continue;
5764 part = var_to_partition (SA.map, name);
5765 if (part == NO_PARTITION)
5766 continue;
5768 /* Adjust all partition members to get the underlying decl of
5769 the representative which we might have created in expand_one_var. */
5770 if (SSA_NAME_VAR (name) == NULL_TREE)
5772 tree leader = partition_to_var (SA.map, part);
5773 gcc_assert (SSA_NAME_VAR (leader) != NULL_TREE);
5774 replace_ssa_name_symbol (name, SSA_NAME_VAR (leader));
5776 if (!POINTER_TYPE_P (TREE_TYPE (name)))
5777 continue;
5779 r = SA.partition_to_pseudo[part];
5780 if (REG_P (r))
5781 mark_reg_pointer (r, get_pointer_alignment (name));
5784 /* If this function is `main', emit a call to `__main'
5785 to run global initializers, etc. */
5786 if (DECL_NAME (current_function_decl)
5787 && MAIN_NAME_P (DECL_NAME (current_function_decl))
5788 && DECL_FILE_SCOPE_P (current_function_decl))
5789 expand_main_function ();
5791 /* Initialize the stack_protect_guard field. This must happen after the
5792 call to __main (if any) so that the external decl is initialized. */
5793 if (crtl->stack_protect_guard)
5794 stack_protect_prologue ();
5796 expand_phi_nodes (&SA);
5798 /* Register rtl specific functions for cfg. */
5799 rtl_register_cfg_hooks ();
5801 init_block = construct_init_block ();
5803 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
5804 remaining edges later. */
5805 FOR_EACH_EDGE (e, ei, ENTRY_BLOCK_PTR_FOR_FN (fun)->succs)
5806 e->flags &= ~EDGE_EXECUTABLE;
5808 lab_rtx_for_bb = new hash_map<basic_block, rtx_code_label *>;
5809 FOR_BB_BETWEEN (bb, init_block->next_bb, EXIT_BLOCK_PTR_FOR_FN (fun),
5810 next_bb)
5811 bb = expand_gimple_basic_block (bb, var_ret_seq != NULL_RTX);
5813 if (MAY_HAVE_DEBUG_INSNS)
5814 expand_debug_locations ();
5816 /* Free stuff we no longer need after GIMPLE optimizations. */
5817 free_dominance_info (CDI_DOMINATORS);
5818 free_dominance_info (CDI_POST_DOMINATORS);
5819 delete_tree_cfg_annotations ();
5821 timevar_push (TV_OUT_OF_SSA);
5822 finish_out_of_ssa (&SA);
5823 timevar_pop (TV_OUT_OF_SSA);
5825 timevar_push (TV_POST_EXPAND);
5826 /* We are no longer in SSA form. */
5827 fun->gimple_df->in_ssa_p = false;
5828 loops_state_clear (LOOP_CLOSED_SSA);
5830 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
5831 conservatively to true until they are all profile aware. */
5832 delete lab_rtx_for_bb;
5833 free_histograms ();
5835 construct_exit_block ();
5836 insn_locations_finalize ();
5838 if (var_ret_seq)
5840 rtx_insn *after = return_label;
5841 rtx_insn *next = NEXT_INSN (after);
5842 if (next && NOTE_INSN_BASIC_BLOCK_P (next))
5843 after = next;
5844 emit_insn_after (var_ret_seq, after);
5847 /* Zap the tree EH table. */
5848 set_eh_throw_stmt_table (fun, NULL);
5850 /* We need JUMP_LABEL be set in order to redirect jumps, and hence
5851 split edges which edge insertions might do. */
5852 rebuild_jump_labels (get_insns ());
5854 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun),
5855 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
5857 edge e;
5858 edge_iterator ei;
5859 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
5861 if (e->insns.r)
5863 rebuild_jump_labels_chain (e->insns.r);
5864 /* Put insns after parm birth, but before
5865 NOTE_INSNS_FUNCTION_BEG. */
5866 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (fun)
5867 && single_succ_p (ENTRY_BLOCK_PTR_FOR_FN (fun)))
5869 rtx_insn *insns = e->insns.r;
5870 e->insns.r = NULL;
5871 if (NOTE_P (parm_birth_insn)
5872 && NOTE_KIND (parm_birth_insn) == NOTE_INSN_FUNCTION_BEG)
5873 emit_insn_before_noloc (insns, parm_birth_insn, e->dest);
5874 else
5875 emit_insn_after_noloc (insns, parm_birth_insn, e->dest);
5877 else
5878 commit_one_edge_insertion (e);
5880 else
5881 ei_next (&ei);
5885 /* We're done expanding trees to RTL. */
5886 currently_expanding_to_rtl = 0;
5888 FOR_BB_BETWEEN (bb, ENTRY_BLOCK_PTR_FOR_FN (fun)->next_bb,
5889 EXIT_BLOCK_PTR_FOR_FN (fun), next_bb)
5891 edge e;
5892 edge_iterator ei;
5893 for (ei = ei_start (bb->succs); (e = ei_safe_edge (ei)); )
5895 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
5896 e->flags &= ~EDGE_EXECUTABLE;
5898 /* At the moment not all abnormal edges match the RTL
5899 representation. It is safe to remove them here as
5900 find_many_sub_basic_blocks will rediscover them.
5901 In the future we should get this fixed properly. */
5902 if ((e->flags & EDGE_ABNORMAL)
5903 && !(e->flags & EDGE_SIBCALL))
5904 remove_edge (e);
5905 else
5906 ei_next (&ei);
5910 blocks = sbitmap_alloc (last_basic_block_for_fn (fun));
5911 bitmap_ones (blocks);
5912 find_many_sub_basic_blocks (blocks);
5913 sbitmap_free (blocks);
5914 purge_all_dead_edges ();
5916 expand_stack_alignment ();
5918 /* Fixup REG_EQUIV notes in the prologue if there are tailcalls in this
5919 function. */
5920 if (crtl->tail_call_emit)
5921 fixup_tail_calls ();
5923 /* After initial rtl generation, call back to finish generating
5924 exception support code. We need to do this before cleaning up
5925 the CFG as the code does not expect dead landing pads. */
5926 if (fun->eh->region_tree != NULL)
5927 finish_eh_generation ();
5929 /* Remove unreachable blocks, otherwise we cannot compute dominators
5930 which are needed for loop state verification. As a side-effect
5931 this also compacts blocks.
5932 ??? We cannot remove trivially dead insns here as for example
5933 the DRAP reg on i?86 is not magically live at this point.
5934 gcc.c-torture/execute/ipa-sra-2.c execution, -Os -m32 fails otherwise. */
5935 cleanup_cfg (CLEANUP_NO_INSN_DEL);
5937 #ifdef ENABLE_CHECKING
5938 verify_flow_info ();
5939 #endif
5941 /* Initialize pseudos allocated for hard registers. */
5942 emit_initial_value_sets ();
5944 /* And finally unshare all RTL. */
5945 unshare_all_rtl ();
5947 /* There's no need to defer outputting this function any more; we
5948 know we want to output it. */
5949 DECL_DEFER_OUTPUT (current_function_decl) = 0;
5951 /* Now that we're done expanding trees to RTL, we shouldn't have any
5952 more CONCATs anywhere. */
5953 generating_concat_p = 0;
5955 if (dump_file)
5957 fprintf (dump_file,
5958 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
5959 /* And the pass manager will dump RTL for us. */
5962 /* If we're emitting a nested function, make sure its parent gets
5963 emitted as well. Doing otherwise confuses debug info. */
5965 tree parent;
5966 for (parent = DECL_CONTEXT (current_function_decl);
5967 parent != NULL_TREE;
5968 parent = get_containing_scope (parent))
5969 if (TREE_CODE (parent) == FUNCTION_DECL)
5970 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent)) = 1;
5973 /* We are now committed to emitting code for this function. Do any
5974 preparation, such as emitting abstract debug info for the inline
5975 before it gets mangled by optimization. */
5976 if (cgraph_function_possibly_inlined_p (current_function_decl))
5977 (*debug_hooks->outlining_inline_function) (current_function_decl);
5979 TREE_ASM_WRITTEN (current_function_decl) = 1;
5981 /* After expanding, the return labels are no longer needed. */
5982 return_label = NULL;
5983 naked_return_label = NULL;
5985 /* After expanding, the tm_restart map is no longer needed. */
5986 if (fun->gimple_df->tm_restart)
5988 htab_delete (fun->gimple_df->tm_restart);
5989 fun->gimple_df->tm_restart = NULL;
5992 /* Tag the blocks with a depth number so that change_scope can find
5993 the common parent easily. */
5994 set_block_levels (DECL_INITIAL (fun->decl), 0);
5995 default_rtl_profile ();
5997 timevar_pop (TV_POST_EXPAND);
5999 return 0;
6002 } // anon namespace
6004 rtl_opt_pass *
6005 make_pass_expand (gcc::context *ctxt)
6007 return new pass_expand (ctxt);