1 /* A pass for lowering trees to RTL.
2 Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011
3 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
23 #include "coretypes.h"
28 #include "basic-block.h"
31 #include "langhooks.h"
32 #include "tree-flow.h"
34 #include "tree-dump.h"
35 #include "tree-pass.h"
38 #include "diagnostic.h"
39 #include "tree-pretty-print.h"
40 #include "gimple-pretty-print.h"
44 #include "tree-inline.h"
45 #include "value-prof.h"
47 #include "ssaexpand.h"
50 #include "insn-attr.h" /* For INSN_SCHEDULING. */
52 /* This variable holds information helping the rewriting of SSA trees
56 /* This variable holds the currently expanded gimple statement for purposes
57 of comminucating the profile info to the builtin expanders. */
58 gimple currently_expanding_gimple_stmt
;
60 /* Return an expression tree corresponding to the RHS of GIMPLE
64 gimple_assign_rhs_to_tree (gimple stmt
)
67 enum gimple_rhs_class grhs_class
;
69 grhs_class
= get_gimple_rhs_class (gimple_expr_code (stmt
));
71 if (grhs_class
== GIMPLE_TERNARY_RHS
)
72 t
= build3 (gimple_assign_rhs_code (stmt
),
73 TREE_TYPE (gimple_assign_lhs (stmt
)),
74 gimple_assign_rhs1 (stmt
),
75 gimple_assign_rhs2 (stmt
),
76 gimple_assign_rhs3 (stmt
));
77 else if (grhs_class
== GIMPLE_BINARY_RHS
)
78 t
= build2 (gimple_assign_rhs_code (stmt
),
79 TREE_TYPE (gimple_assign_lhs (stmt
)),
80 gimple_assign_rhs1 (stmt
),
81 gimple_assign_rhs2 (stmt
));
82 else if (grhs_class
== GIMPLE_UNARY_RHS
)
83 t
= build1 (gimple_assign_rhs_code (stmt
),
84 TREE_TYPE (gimple_assign_lhs (stmt
)),
85 gimple_assign_rhs1 (stmt
));
86 else if (grhs_class
== GIMPLE_SINGLE_RHS
)
88 t
= gimple_assign_rhs1 (stmt
);
89 /* Avoid modifying this tree in place below. */
90 if ((gimple_has_location (stmt
) && CAN_HAVE_LOCATION_P (t
)
91 && gimple_location (stmt
) != EXPR_LOCATION (t
))
92 || (gimple_block (stmt
)
93 && currently_expanding_to_rtl
95 && gimple_block (stmt
) != TREE_BLOCK (t
)))
101 if (gimple_has_location (stmt
) && CAN_HAVE_LOCATION_P (t
))
102 SET_EXPR_LOCATION (t
, gimple_location (stmt
));
103 if (gimple_block (stmt
) && currently_expanding_to_rtl
&& EXPR_P (t
))
104 TREE_BLOCK (t
) = gimple_block (stmt
);
110 #ifndef STACK_ALIGNMENT_NEEDED
111 #define STACK_ALIGNMENT_NEEDED 1
114 #define SSAVAR(x) (TREE_CODE (x) == SSA_NAME ? SSA_NAME_VAR (x) : x)
116 /* Associate declaration T with storage space X. If T is no
117 SSA name this is exactly SET_DECL_RTL, otherwise make the
118 partition of T associated with X. */
120 set_rtl (tree t
, rtx x
)
122 if (TREE_CODE (t
) == SSA_NAME
)
124 SA
.partition_to_pseudo
[var_to_partition (SA
.map
, t
)] = x
;
126 set_reg_attrs_for_decl_rtl (SSA_NAME_VAR (t
), x
);
127 /* For the benefit of debug information at -O0 (where vartracking
128 doesn't run) record the place also in the base DECL if it's
129 a normal variable (not a parameter). */
130 if (x
&& x
!= pc_rtx
&& TREE_CODE (SSA_NAME_VAR (t
)) == VAR_DECL
)
132 tree var
= SSA_NAME_VAR (t
);
133 /* If we don't yet have something recorded, just record it now. */
134 if (!DECL_RTL_SET_P (var
))
135 SET_DECL_RTL (var
, x
);
136 /* If we have it set alrady to "multiple places" don't
138 else if (DECL_RTL (var
) == pc_rtx
)
140 /* If we have something recorded and it's not the same place
141 as we want to record now, we have multiple partitions for the
142 same base variable, with different places. We can't just
143 randomly chose one, hence we have to say that we don't know.
144 This only happens with optimization, and there var-tracking
145 will figure out the right thing. */
146 else if (DECL_RTL (var
) != x
)
147 SET_DECL_RTL (var
, pc_rtx
);
154 /* This structure holds data relevant to one variable that will be
155 placed in a stack slot. */
161 /* The offset of the variable. During partitioning, this is the
162 offset relative to the partition. After partitioning, this
163 is relative to the stack frame. */
164 HOST_WIDE_INT offset
;
166 /* Initially, the size of the variable. Later, the size of the partition,
167 if this variable becomes it's partition's representative. */
170 /* The *byte* alignment required for this variable. Or as, with the
171 size, the alignment for this partition. */
174 /* The partition representative. */
175 size_t representative
;
177 /* The next stack variable in the partition, or EOC. */
180 /* The numbers of conflicting stack variables. */
184 #define EOC ((size_t)-1)
186 /* We have an array of such objects while deciding allocation. */
187 static struct stack_var
*stack_vars
;
188 static size_t stack_vars_alloc
;
189 static size_t stack_vars_num
;
191 /* An array of indices such that stack_vars[stack_vars_sorted[i]].size
192 is non-decreasing. */
193 static size_t *stack_vars_sorted
;
195 /* The phase of the stack frame. This is the known misalignment of
196 virtual_stack_vars_rtx from PREFERRED_STACK_BOUNDARY. That is,
197 (frame_offset+frame_phase) % PREFERRED_STACK_BOUNDARY == 0. */
198 static int frame_phase
;
200 /* Used during expand_used_vars to remember if we saw any decls for
201 which we'd like to enable stack smashing protection. */
202 static bool has_protected_decls
;
204 /* Used during expand_used_vars. Remember if we say a character buffer
205 smaller than our cutoff threshold. Used for -Wstack-protector. */
206 static bool has_short_buffer
;
208 /* Discover the byte alignment to use for DECL. Ignore alignment
209 we can't do with expected alignment of the stack boundary. */
212 get_decl_align_unit (tree decl
)
214 unsigned int align
= LOCAL_DECL_ALIGNMENT (decl
);
215 return align
/ BITS_PER_UNIT
;
218 /* Allocate SIZE bytes at byte alignment ALIGN from the stack frame.
219 Return the frame offset. */
222 alloc_stack_frame_space (HOST_WIDE_INT size
, unsigned HOST_WIDE_INT align
)
224 HOST_WIDE_INT offset
, new_frame_offset
;
226 new_frame_offset
= frame_offset
;
227 if (FRAME_GROWS_DOWNWARD
)
229 new_frame_offset
-= size
+ frame_phase
;
230 new_frame_offset
&= -align
;
231 new_frame_offset
+= frame_phase
;
232 offset
= new_frame_offset
;
236 new_frame_offset
-= frame_phase
;
237 new_frame_offset
+= align
- 1;
238 new_frame_offset
&= -align
;
239 new_frame_offset
+= frame_phase
;
240 offset
= new_frame_offset
;
241 new_frame_offset
+= size
;
243 frame_offset
= new_frame_offset
;
245 if (frame_offset_overflow (frame_offset
, cfun
->decl
))
246 frame_offset
= offset
= 0;
251 /* Accumulate DECL into STACK_VARS. */
254 add_stack_var (tree decl
)
258 if (stack_vars_num
>= stack_vars_alloc
)
260 if (stack_vars_alloc
)
261 stack_vars_alloc
= stack_vars_alloc
* 3 / 2;
263 stack_vars_alloc
= 32;
265 = XRESIZEVEC (struct stack_var
, stack_vars
, stack_vars_alloc
);
267 v
= &stack_vars
[stack_vars_num
];
271 v
->size
= tree_low_cst (DECL_SIZE_UNIT (SSAVAR (decl
)), 1);
272 /* Ensure that all variables have size, so that &a != &b for any two
273 variables that are simultaneously live. */
276 v
->alignb
= get_decl_align_unit (SSAVAR (decl
));
278 /* All variables are initially in their own partition. */
279 v
->representative
= stack_vars_num
;
282 /* All variables initially conflict with no other. */
285 /* Ensure that this decl doesn't get put onto the list twice. */
286 set_rtl (decl
, pc_rtx
);
291 /* Make the decls associated with luid's X and Y conflict. */
294 add_stack_var_conflict (size_t x
, size_t y
)
296 struct stack_var
*a
= &stack_vars
[x
];
297 struct stack_var
*b
= &stack_vars
[y
];
299 a
->conflicts
= BITMAP_ALLOC (NULL
);
301 b
->conflicts
= BITMAP_ALLOC (NULL
);
302 bitmap_set_bit (a
->conflicts
, y
);
303 bitmap_set_bit (b
->conflicts
, x
);
306 /* Check whether the decls associated with luid's X and Y conflict. */
309 stack_var_conflict_p (size_t x
, size_t y
)
311 struct stack_var
*a
= &stack_vars
[x
];
312 struct stack_var
*b
= &stack_vars
[y
];
313 if (!a
->conflicts
|| !b
->conflicts
)
315 return bitmap_bit_p (a
->conflicts
, y
);
318 /* Returns true if TYPE is or contains a union type. */
321 aggregate_contains_union_type (tree type
)
325 if (TREE_CODE (type
) == UNION_TYPE
326 || TREE_CODE (type
) == QUAL_UNION_TYPE
)
328 if (TREE_CODE (type
) == ARRAY_TYPE
)
329 return aggregate_contains_union_type (TREE_TYPE (type
));
330 if (TREE_CODE (type
) != RECORD_TYPE
)
333 for (field
= TYPE_FIELDS (type
); field
; field
= DECL_CHAIN (field
))
334 if (TREE_CODE (field
) == FIELD_DECL
)
335 if (aggregate_contains_union_type (TREE_TYPE (field
)))
341 /* A subroutine of expand_used_vars. If two variables X and Y have alias
342 sets that do not conflict, then do add a conflict for these variables
343 in the interference graph. We also need to make sure to add conflicts
344 for union containing structures. Else RTL alias analysis comes along
345 and due to type based aliasing rules decides that for two overlapping
346 union temporaries { short s; int i; } accesses to the same mem through
347 different types may not alias and happily reorders stores across
348 life-time boundaries of the temporaries (See PR25654).
349 We also have to mind MEM_IN_STRUCT_P and MEM_SCALAR_P. */
352 add_alias_set_conflicts (void)
354 size_t i
, j
, n
= stack_vars_num
;
356 for (i
= 0; i
< n
; ++i
)
358 tree type_i
= TREE_TYPE (stack_vars
[i
].decl
);
359 bool aggr_i
= AGGREGATE_TYPE_P (type_i
);
362 contains_union
= aggregate_contains_union_type (type_i
);
363 for (j
= 0; j
< i
; ++j
)
365 tree type_j
= TREE_TYPE (stack_vars
[j
].decl
);
366 bool aggr_j
= AGGREGATE_TYPE_P (type_j
);
368 /* Either the objects conflict by means of type based
369 aliasing rules, or we need to add a conflict. */
370 || !objects_must_conflict_p (type_i
, type_j
)
371 /* In case the types do not conflict ensure that access
372 to elements will conflict. In case of unions we have
373 to be careful as type based aliasing rules may say
374 access to the same memory does not conflict. So play
375 safe and add a conflict in this case. */
377 add_stack_var_conflict (i
, j
);
382 /* A subroutine of partition_stack_vars. A comparison function for qsort,
383 sorting an array of indices by the properties of the object. */
386 stack_var_cmp (const void *a
, const void *b
)
388 size_t ia
= *(const size_t *)a
;
389 size_t ib
= *(const size_t *)b
;
390 unsigned int aligna
= stack_vars
[ia
].alignb
;
391 unsigned int alignb
= stack_vars
[ib
].alignb
;
392 HOST_WIDE_INT sizea
= stack_vars
[ia
].size
;
393 HOST_WIDE_INT sizeb
= stack_vars
[ib
].size
;
394 tree decla
= stack_vars
[ia
].decl
;
395 tree declb
= stack_vars
[ib
].decl
;
397 unsigned int uida
, uidb
;
399 /* Primary compare on "large" alignment. Large comes first. */
400 largea
= (aligna
* BITS_PER_UNIT
> MAX_SUPPORTED_STACK_ALIGNMENT
);
401 largeb
= (alignb
* BITS_PER_UNIT
> MAX_SUPPORTED_STACK_ALIGNMENT
);
402 if (largea
!= largeb
)
403 return (int)largeb
- (int)largea
;
405 /* Secondary compare on size, decreasing */
411 /* Tertiary compare on true alignment, decreasing. */
417 /* Final compare on ID for sort stability, increasing.
418 Two SSA names are compared by their version, SSA names come before
419 non-SSA names, and two normal decls are compared by their DECL_UID. */
420 if (TREE_CODE (decla
) == SSA_NAME
)
422 if (TREE_CODE (declb
) == SSA_NAME
)
423 uida
= SSA_NAME_VERSION (decla
), uidb
= SSA_NAME_VERSION (declb
);
427 else if (TREE_CODE (declb
) == SSA_NAME
)
430 uida
= DECL_UID (decla
), uidb
= DECL_UID (declb
);
439 /* If the points-to solution *PI points to variables that are in a partition
440 together with other variables add all partition members to the pointed-to
444 add_partitioned_vars_to_ptset (struct pt_solution
*pt
,
445 struct pointer_map_t
*decls_to_partitions
,
446 struct pointer_set_t
*visited
, bitmap temp
)
454 /* The pointed-to vars bitmap is shared, it is enough to
456 || pointer_set_insert(visited
, pt
->vars
))
461 /* By using a temporary bitmap to store all members of the partitions
462 we have to add we make sure to visit each of the partitions only
464 EXECUTE_IF_SET_IN_BITMAP (pt
->vars
, 0, i
, bi
)
466 || !bitmap_bit_p (temp
, i
))
467 && (part
= (bitmap
*) pointer_map_contains (decls_to_partitions
,
468 (void *)(size_t) i
)))
469 bitmap_ior_into (temp
, *part
);
470 if (!bitmap_empty_p (temp
))
471 bitmap_ior_into (pt
->vars
, temp
);
474 /* Update points-to sets based on partition info, so we can use them on RTL.
475 The bitmaps representing stack partitions will be saved until expand,
476 where partitioned decls used as bases in memory expressions will be
480 update_alias_info_with_stack_vars (void)
482 struct pointer_map_t
*decls_to_partitions
= NULL
;
484 tree var
= NULL_TREE
;
486 for (i
= 0; i
< stack_vars_num
; i
++)
490 struct ptr_info_def
*pi
;
492 /* Not interested in partitions with single variable. */
493 if (stack_vars
[i
].representative
!= i
494 || stack_vars
[i
].next
== EOC
)
497 if (!decls_to_partitions
)
499 decls_to_partitions
= pointer_map_create ();
500 cfun
->gimple_df
->decls_to_pointers
= pointer_map_create ();
503 /* Create an SSA_NAME that points to the partition for use
504 as base during alias-oracle queries on RTL for bases that
505 have been partitioned. */
506 if (var
== NULL_TREE
)
507 var
= create_tmp_var (ptr_type_node
, NULL
);
508 name
= make_ssa_name (var
, NULL
);
510 /* Create bitmaps representing partitions. They will be used for
511 points-to sets later, so use GGC alloc. */
512 part
= BITMAP_GGC_ALLOC ();
513 for (j
= i
; j
!= EOC
; j
= stack_vars
[j
].next
)
515 tree decl
= stack_vars
[j
].decl
;
516 unsigned int uid
= DECL_PT_UID (decl
);
517 /* We should never end up partitioning SSA names (though they
518 may end up on the stack). Neither should we allocate stack
519 space to something that is unused and thus unreferenced, except
520 for -O0 where we are preserving even unreferenced variables. */
521 gcc_assert (DECL_P (decl
)
523 || referenced_var_lookup (DECL_UID (decl
))));
524 bitmap_set_bit (part
, uid
);
525 *((bitmap
*) pointer_map_insert (decls_to_partitions
,
526 (void *)(size_t) uid
)) = part
;
527 *((tree
*) pointer_map_insert (cfun
->gimple_df
->decls_to_pointers
,
531 /* Make the SSA name point to all partition members. */
532 pi
= get_ptr_info (name
);
533 pt_solution_set (&pi
->pt
, part
, false, false);
536 /* Make all points-to sets that contain one member of a partition
537 contain all members of the partition. */
538 if (decls_to_partitions
)
541 struct pointer_set_t
*visited
= pointer_set_create ();
542 bitmap temp
= BITMAP_ALLOC (NULL
);
544 for (i
= 1; i
< num_ssa_names
; i
++)
546 tree name
= ssa_name (i
);
547 struct ptr_info_def
*pi
;
550 && POINTER_TYPE_P (TREE_TYPE (name
))
551 && ((pi
= SSA_NAME_PTR_INFO (name
)) != NULL
))
552 add_partitioned_vars_to_ptset (&pi
->pt
, decls_to_partitions
,
556 add_partitioned_vars_to_ptset (&cfun
->gimple_df
->escaped
,
557 decls_to_partitions
, visited
, temp
);
559 pointer_set_destroy (visited
);
560 pointer_map_destroy (decls_to_partitions
);
565 /* A subroutine of partition_stack_vars. The UNION portion of a UNION/FIND
566 partitioning algorithm. Partitions A and B are known to be non-conflicting.
567 Merge them into a single partition A.
569 At the same time, add OFFSET to all variables in partition B. At the end
570 of the partitioning process we've have a nice block easy to lay out within
574 union_stack_vars (size_t a
, size_t b
, HOST_WIDE_INT offset
)
577 struct stack_var
*vb
= &stack_vars
[b
];
581 /* Update each element of partition B with the given offset,
582 and merge them into partition A. */
583 for (last
= i
= b
; i
!= EOC
; last
= i
, i
= stack_vars
[i
].next
)
585 stack_vars
[i
].offset
+= offset
;
586 stack_vars
[i
].representative
= a
;
588 stack_vars
[last
].next
= stack_vars
[a
].next
;
589 stack_vars
[a
].next
= b
;
591 /* Update the required alignment of partition A to account for B. */
592 if (stack_vars
[a
].alignb
< stack_vars
[b
].alignb
)
593 stack_vars
[a
].alignb
= stack_vars
[b
].alignb
;
595 /* Update the interference graph and merge the conflicts. */
598 EXECUTE_IF_SET_IN_BITMAP (vb
->conflicts
, 0, u
, bi
)
599 add_stack_var_conflict (a
, stack_vars
[u
].representative
);
600 BITMAP_FREE (vb
->conflicts
);
604 /* A subroutine of expand_used_vars. Binpack the variables into
605 partitions constrained by the interference graph. The overall
606 algorithm used is as follows:
608 Sort the objects by size.
613 Look for the largest non-conflicting object B with size <= S.
623 partition_stack_vars (void)
625 size_t si
, sj
, n
= stack_vars_num
;
627 stack_vars_sorted
= XNEWVEC (size_t, stack_vars_num
);
628 for (si
= 0; si
< n
; ++si
)
629 stack_vars_sorted
[si
] = si
;
634 qsort (stack_vars_sorted
, n
, sizeof (size_t), stack_var_cmp
);
636 for (si
= 0; si
< n
; ++si
)
638 size_t i
= stack_vars_sorted
[si
];
639 HOST_WIDE_INT isize
= stack_vars
[i
].size
;
640 unsigned int ialign
= stack_vars
[i
].alignb
;
641 HOST_WIDE_INT offset
= 0;
643 for (sj
= si
; sj
-- > 0; )
645 size_t j
= stack_vars_sorted
[sj
];
646 HOST_WIDE_INT jsize
= stack_vars
[j
].size
;
647 unsigned int jalign
= stack_vars
[j
].alignb
;
649 /* Ignore objects that aren't partition representatives. */
650 if (stack_vars
[j
].representative
!= j
)
653 /* Ignore objects too large for the remaining space. */
657 /* Ignore conflicting objects. */
658 if (stack_var_conflict_p (i
, j
))
661 /* Do not mix objects of "small" (supported) alignment
662 and "large" (unsupported) alignment. */
663 if ((ialign
* BITS_PER_UNIT
<= MAX_SUPPORTED_STACK_ALIGNMENT
)
664 != (jalign
* BITS_PER_UNIT
<= MAX_SUPPORTED_STACK_ALIGNMENT
))
667 /* Refine the remaining space check to include alignment. */
668 if (offset
& (jalign
- 1))
670 HOST_WIDE_INT toff
= offset
;
672 toff
&= -(HOST_WIDE_INT
)jalign
;
673 if (isize
- (toff
- offset
) < jsize
)
676 isize
-= toff
- offset
;
680 /* UNION the objects, placing J at OFFSET. */
681 union_stack_vars (i
, j
, offset
);
689 update_alias_info_with_stack_vars ();
692 /* A debugging aid for expand_used_vars. Dump the generated partitions. */
695 dump_stack_var_partition (void)
697 size_t si
, i
, j
, n
= stack_vars_num
;
699 for (si
= 0; si
< n
; ++si
)
701 i
= stack_vars_sorted
[si
];
703 /* Skip variables that aren't partition representatives, for now. */
704 if (stack_vars
[i
].representative
!= i
)
707 fprintf (dump_file
, "Partition %lu: size " HOST_WIDE_INT_PRINT_DEC
708 " align %u\n", (unsigned long) i
, stack_vars
[i
].size
,
709 stack_vars
[i
].alignb
);
711 for (j
= i
; j
!= EOC
; j
= stack_vars
[j
].next
)
713 fputc ('\t', dump_file
);
714 print_generic_expr (dump_file
, stack_vars
[j
].decl
, dump_flags
);
715 fprintf (dump_file
, ", offset " HOST_WIDE_INT_PRINT_DEC
"\n",
716 stack_vars
[j
].offset
);
721 /* Assign rtl to DECL at BASE + OFFSET. */
724 expand_one_stack_var_at (tree decl
, rtx base
, unsigned base_align
,
725 HOST_WIDE_INT offset
)
730 /* If this fails, we've overflowed the stack frame. Error nicely? */
731 gcc_assert (offset
== trunc_int_for_mode (offset
, Pmode
));
733 x
= plus_constant (base
, offset
);
734 x
= gen_rtx_MEM (DECL_MODE (SSAVAR (decl
)), x
);
736 if (TREE_CODE (decl
) != SSA_NAME
)
738 /* Set alignment we actually gave this decl if it isn't an SSA name.
739 If it is we generate stack slots only accidentally so it isn't as
740 important, we'll simply use the alignment that is already set. */
741 if (base
== virtual_stack_vars_rtx
)
742 offset
-= frame_phase
;
743 align
= offset
& -offset
;
744 align
*= BITS_PER_UNIT
;
745 if (align
== 0 || align
> base_align
)
748 /* One would think that we could assert that we're not decreasing
749 alignment here, but (at least) the i386 port does exactly this
750 via the MINIMUM_ALIGNMENT hook. */
752 DECL_ALIGN (decl
) = align
;
753 DECL_USER_ALIGN (decl
) = 0;
756 set_mem_attributes (x
, SSAVAR (decl
), true);
760 /* A subroutine of expand_used_vars. Give each partition representative
761 a unique location within the stack frame. Update each partition member
762 with that location. */
765 expand_stack_vars (bool (*pred
) (tree
))
767 size_t si
, i
, j
, n
= stack_vars_num
;
768 HOST_WIDE_INT large_size
= 0, large_alloc
= 0;
769 rtx large_base
= NULL
;
770 unsigned large_align
= 0;
773 /* Determine if there are any variables requiring "large" alignment.
774 Since these are dynamically allocated, we only process these if
775 no predicate involved. */
776 large_align
= stack_vars
[stack_vars_sorted
[0]].alignb
* BITS_PER_UNIT
;
777 if (pred
== NULL
&& large_align
> MAX_SUPPORTED_STACK_ALIGNMENT
)
779 /* Find the total size of these variables. */
780 for (si
= 0; si
< n
; ++si
)
784 i
= stack_vars_sorted
[si
];
785 alignb
= stack_vars
[i
].alignb
;
787 /* Stop when we get to the first decl with "small" alignment. */
788 if (alignb
* BITS_PER_UNIT
<= MAX_SUPPORTED_STACK_ALIGNMENT
)
791 /* Skip variables that aren't partition representatives. */
792 if (stack_vars
[i
].representative
!= i
)
795 /* Skip variables that have already had rtl assigned. See also
796 add_stack_var where we perpetrate this pc_rtx hack. */
797 decl
= stack_vars
[i
].decl
;
798 if ((TREE_CODE (decl
) == SSA_NAME
799 ? SA
.partition_to_pseudo
[var_to_partition (SA
.map
, decl
)]
800 : DECL_RTL (decl
)) != pc_rtx
)
803 large_size
+= alignb
- 1;
804 large_size
&= -(HOST_WIDE_INT
)alignb
;
805 large_size
+= stack_vars
[i
].size
;
808 /* If there were any, allocate space. */
810 large_base
= allocate_dynamic_stack_space (GEN_INT (large_size
), 0,
814 for (si
= 0; si
< n
; ++si
)
817 unsigned base_align
, alignb
;
818 HOST_WIDE_INT offset
;
820 i
= stack_vars_sorted
[si
];
822 /* Skip variables that aren't partition representatives, for now. */
823 if (stack_vars
[i
].representative
!= i
)
826 /* Skip variables that have already had rtl assigned. See also
827 add_stack_var where we perpetrate this pc_rtx hack. */
828 decl
= stack_vars
[i
].decl
;
829 if ((TREE_CODE (decl
) == SSA_NAME
830 ? SA
.partition_to_pseudo
[var_to_partition (SA
.map
, decl
)]
831 : DECL_RTL (decl
)) != pc_rtx
)
834 /* Check the predicate to see whether this variable should be
835 allocated in this pass. */
836 if (pred
&& !pred (decl
))
839 alignb
= stack_vars
[i
].alignb
;
840 if (alignb
* BITS_PER_UNIT
<= MAX_SUPPORTED_STACK_ALIGNMENT
)
842 offset
= alloc_stack_frame_space (stack_vars
[i
].size
, alignb
);
843 base
= virtual_stack_vars_rtx
;
844 base_align
= crtl
->max_used_stack_slot_alignment
;
848 /* Large alignment is only processed in the last pass. */
851 gcc_assert (large_base
!= NULL
);
853 large_alloc
+= alignb
- 1;
854 large_alloc
&= -(HOST_WIDE_INT
)alignb
;
855 offset
= large_alloc
;
856 large_alloc
+= stack_vars
[i
].size
;
859 base_align
= large_align
;
862 /* Create rtl for each variable based on their location within the
864 for (j
= i
; j
!= EOC
; j
= stack_vars
[j
].next
)
866 gcc_assert (stack_vars
[j
].offset
<= stack_vars
[i
].size
);
867 expand_one_stack_var_at (stack_vars
[j
].decl
,
869 stack_vars
[j
].offset
+ offset
);
873 gcc_assert (large_alloc
== large_size
);
876 /* Take into account all sizes of partitions and reset DECL_RTLs. */
878 account_stack_vars (void)
880 size_t si
, j
, i
, n
= stack_vars_num
;
881 HOST_WIDE_INT size
= 0;
883 for (si
= 0; si
< n
; ++si
)
885 i
= stack_vars_sorted
[si
];
887 /* Skip variables that aren't partition representatives, for now. */
888 if (stack_vars
[i
].representative
!= i
)
891 size
+= stack_vars
[i
].size
;
892 for (j
= i
; j
!= EOC
; j
= stack_vars
[j
].next
)
893 set_rtl (stack_vars
[j
].decl
, NULL
);
898 /* A subroutine of expand_one_var. Called to immediately assign rtl
899 to a variable to be allocated in the stack frame. */
902 expand_one_stack_var (tree var
)
904 HOST_WIDE_INT size
, offset
;
907 size
= tree_low_cst (DECL_SIZE_UNIT (SSAVAR (var
)), 1);
908 byte_align
= get_decl_align_unit (SSAVAR (var
));
910 /* We handle highly aligned variables in expand_stack_vars. */
911 gcc_assert (byte_align
* BITS_PER_UNIT
<= MAX_SUPPORTED_STACK_ALIGNMENT
);
913 offset
= alloc_stack_frame_space (size
, byte_align
);
915 expand_one_stack_var_at (var
, virtual_stack_vars_rtx
,
916 crtl
->max_used_stack_slot_alignment
, offset
);
919 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
920 that will reside in a hard register. */
923 expand_one_hard_reg_var (tree var
)
925 rest_of_decl_compilation (var
, 0, 0);
928 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL
929 that will reside in a pseudo register. */
932 expand_one_register_var (tree var
)
934 tree decl
= SSAVAR (var
);
935 tree type
= TREE_TYPE (decl
);
936 enum machine_mode reg_mode
= promote_decl_mode (decl
, NULL
);
937 rtx x
= gen_reg_rtx (reg_mode
);
941 /* Note if the object is a user variable. */
942 if (!DECL_ARTIFICIAL (decl
))
945 if (POINTER_TYPE_P (type
))
946 mark_reg_pointer (x
, TYPE_ALIGN (TREE_TYPE (type
)));
949 /* A subroutine of expand_one_var. Called to assign rtl to a VAR_DECL that
950 has some associated error, e.g. its type is error-mark. We just need
951 to pick something that won't crash the rest of the compiler. */
954 expand_one_error_var (tree var
)
956 enum machine_mode mode
= DECL_MODE (var
);
960 x
= gen_rtx_MEM (BLKmode
, const0_rtx
);
961 else if (mode
== VOIDmode
)
964 x
= gen_reg_rtx (mode
);
966 SET_DECL_RTL (var
, x
);
969 /* A subroutine of expand_one_var. VAR is a variable that will be
970 allocated to the local stack frame. Return true if we wish to
971 add VAR to STACK_VARS so that it will be coalesced with other
972 variables. Return false to allocate VAR immediately.
974 This function is used to reduce the number of variables considered
975 for coalescing, which reduces the size of the quadratic problem. */
978 defer_stack_allocation (tree var
, bool toplevel
)
980 /* If stack protection is enabled, *all* stack variables must be deferred,
981 so that we can re-order the strings to the top of the frame. */
982 if (flag_stack_protect
)
985 /* We handle "large" alignment via dynamic allocation. We want to handle
986 this extra complication in only one place, so defer them. */
987 if (DECL_ALIGN (var
) > MAX_SUPPORTED_STACK_ALIGNMENT
)
990 /* Variables in the outermost scope automatically conflict with
991 every other variable. The only reason to want to defer them
992 at all is that, after sorting, we can more efficiently pack
993 small variables in the stack frame. Continue to defer at -O2. */
994 if (toplevel
&& optimize
< 2)
997 /* Without optimization, *most* variables are allocated from the
998 stack, which makes the quadratic problem large exactly when we
999 want compilation to proceed as quickly as possible. On the
1000 other hand, we don't want the function's stack frame size to
1001 get completely out of hand. So we avoid adding scalars and
1002 "small" aggregates to the list at all. */
1003 if (optimize
== 0 && tree_low_cst (DECL_SIZE_UNIT (var
), 1) < 32)
1009 /* A subroutine of expand_used_vars. Expand one variable according to
1010 its flavor. Variables to be placed on the stack are not actually
1011 expanded yet, merely recorded.
1012 When REALLY_EXPAND is false, only add stack values to be allocated.
1013 Return stack usage this variable is supposed to take.
1016 static HOST_WIDE_INT
1017 expand_one_var (tree var
, bool toplevel
, bool really_expand
)
1019 unsigned int align
= BITS_PER_UNIT
;
1024 if (TREE_TYPE (var
) != error_mark_node
&& TREE_CODE (var
) == VAR_DECL
)
1026 /* Because we don't know if VAR will be in register or on stack,
1027 we conservatively assume it will be on stack even if VAR is
1028 eventually put into register after RA pass. For non-automatic
1029 variables, which won't be on stack, we collect alignment of
1030 type and ignore user specified alignment. */
1031 if (TREE_STATIC (var
) || DECL_EXTERNAL (var
))
1032 align
= MINIMUM_ALIGNMENT (TREE_TYPE (var
),
1033 TYPE_MODE (TREE_TYPE (var
)),
1034 TYPE_ALIGN (TREE_TYPE (var
)));
1035 else if (DECL_HAS_VALUE_EXPR_P (var
)
1036 || (DECL_RTL_SET_P (var
) && MEM_P (DECL_RTL (var
))))
1037 /* Don't consider debug only variables with DECL_HAS_VALUE_EXPR_P set
1038 or variables which were assigned a stack slot already by
1039 expand_one_stack_var_at - in the latter case DECL_ALIGN has been
1040 changed from the offset chosen to it. */
1041 align
= crtl
->stack_alignment_estimated
;
1043 align
= MINIMUM_ALIGNMENT (var
, DECL_MODE (var
), DECL_ALIGN (var
));
1045 /* If the variable alignment is very large we'll dynamicaly allocate
1046 it, which means that in-frame portion is just a pointer. */
1047 if (align
> MAX_SUPPORTED_STACK_ALIGNMENT
)
1048 align
= POINTER_SIZE
;
1051 if (SUPPORTS_STACK_ALIGNMENT
1052 && crtl
->stack_alignment_estimated
< align
)
1054 /* stack_alignment_estimated shouldn't change after stack
1055 realign decision made */
1056 gcc_assert(!crtl
->stack_realign_processed
);
1057 crtl
->stack_alignment_estimated
= align
;
1060 /* stack_alignment_needed > PREFERRED_STACK_BOUNDARY is permitted.
1061 So here we only make sure stack_alignment_needed >= align. */
1062 if (crtl
->stack_alignment_needed
< align
)
1063 crtl
->stack_alignment_needed
= align
;
1064 if (crtl
->max_used_stack_slot_alignment
< align
)
1065 crtl
->max_used_stack_slot_alignment
= align
;
1067 if (TREE_CODE (origvar
) == SSA_NAME
)
1069 gcc_assert (TREE_CODE (var
) != VAR_DECL
1070 || (!DECL_EXTERNAL (var
)
1071 && !DECL_HAS_VALUE_EXPR_P (var
)
1072 && !TREE_STATIC (var
)
1073 && TREE_TYPE (var
) != error_mark_node
1074 && !DECL_HARD_REGISTER (var
)
1077 if (TREE_CODE (var
) != VAR_DECL
&& TREE_CODE (origvar
) != SSA_NAME
)
1079 else if (DECL_EXTERNAL (var
))
1081 else if (DECL_HAS_VALUE_EXPR_P (var
))
1083 else if (TREE_STATIC (var
))
1085 else if (TREE_CODE (origvar
) != SSA_NAME
&& DECL_RTL_SET_P (var
))
1087 else if (TREE_TYPE (var
) == error_mark_node
)
1090 expand_one_error_var (var
);
1092 else if (TREE_CODE (var
) == VAR_DECL
&& DECL_HARD_REGISTER (var
))
1095 expand_one_hard_reg_var (var
);
1097 else if (use_register_for_decl (var
))
1100 expand_one_register_var (origvar
);
1102 else if (!host_integerp (DECL_SIZE_UNIT (var
), 1))
1106 error ("size of variable %q+D is too large", var
);
1107 expand_one_error_var (var
);
1110 else if (defer_stack_allocation (var
, toplevel
))
1111 add_stack_var (origvar
);
1115 expand_one_stack_var (origvar
);
1116 return tree_low_cst (DECL_SIZE_UNIT (var
), 1);
1121 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1122 expanding variables. Those variables that can be put into registers
1123 are allocated pseudos; those that can't are put on the stack.
1125 TOPLEVEL is true if this is the outermost BLOCK. */
1128 expand_used_vars_for_block (tree block
, bool toplevel
)
1130 size_t i
, j
, old_sv_num
, this_sv_num
, new_sv_num
;
1133 old_sv_num
= toplevel
? 0 : stack_vars_num
;
1135 /* Expand all variables at this level. */
1136 for (t
= BLOCK_VARS (block
); t
; t
= DECL_CHAIN (t
))
1138 expand_one_var (t
, toplevel
, true);
1140 this_sv_num
= stack_vars_num
;
1142 /* Expand all variables at containing levels. */
1143 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
1144 expand_used_vars_for_block (t
, false);
1146 /* Since we do not track exact variable lifetimes (which is not even
1147 possible for variables whose address escapes), we mirror the block
1148 tree in the interference graph. Here we cause all variables at this
1149 level, and all sublevels, to conflict. */
1150 if (old_sv_num
< this_sv_num
)
1152 new_sv_num
= stack_vars_num
;
1154 for (i
= old_sv_num
; i
< new_sv_num
; ++i
)
1155 for (j
= i
< this_sv_num
? i
: this_sv_num
; j
-- > old_sv_num
;)
1156 add_stack_var_conflict (i
, j
);
1160 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1161 and clear TREE_USED on all local variables. */
1164 clear_tree_used (tree block
)
1168 for (t
= BLOCK_VARS (block
); t
; t
= DECL_CHAIN (t
))
1169 /* if (!TREE_STATIC (t) && !DECL_EXTERNAL (t)) */
1172 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
1173 clear_tree_used (t
);
1176 /* Examine TYPE and determine a bit mask of the following features. */
1178 #define SPCT_HAS_LARGE_CHAR_ARRAY 1
1179 #define SPCT_HAS_SMALL_CHAR_ARRAY 2
1180 #define SPCT_HAS_ARRAY 4
1181 #define SPCT_HAS_AGGREGATE 8
1184 stack_protect_classify_type (tree type
)
1186 unsigned int ret
= 0;
1189 switch (TREE_CODE (type
))
1192 t
= TYPE_MAIN_VARIANT (TREE_TYPE (type
));
1193 if (t
== char_type_node
1194 || t
== signed_char_type_node
1195 || t
== unsigned_char_type_node
)
1197 unsigned HOST_WIDE_INT max
= PARAM_VALUE (PARAM_SSP_BUFFER_SIZE
);
1198 unsigned HOST_WIDE_INT len
;
1200 if (!TYPE_SIZE_UNIT (type
)
1201 || !host_integerp (TYPE_SIZE_UNIT (type
), 1))
1204 len
= tree_low_cst (TYPE_SIZE_UNIT (type
), 1);
1207 ret
= SPCT_HAS_SMALL_CHAR_ARRAY
| SPCT_HAS_ARRAY
;
1209 ret
= SPCT_HAS_LARGE_CHAR_ARRAY
| SPCT_HAS_ARRAY
;
1212 ret
= SPCT_HAS_ARRAY
;
1216 case QUAL_UNION_TYPE
:
1218 ret
= SPCT_HAS_AGGREGATE
;
1219 for (t
= TYPE_FIELDS (type
); t
; t
= TREE_CHAIN (t
))
1220 if (TREE_CODE (t
) == FIELD_DECL
)
1221 ret
|= stack_protect_classify_type (TREE_TYPE (t
));
1231 /* Return nonzero if DECL should be segregated into the "vulnerable" upper
1232 part of the local stack frame. Remember if we ever return nonzero for
1233 any variable in this function. The return value is the phase number in
1234 which the variable should be allocated. */
1237 stack_protect_decl_phase (tree decl
)
1239 unsigned int bits
= stack_protect_classify_type (TREE_TYPE (decl
));
1242 if (bits
& SPCT_HAS_SMALL_CHAR_ARRAY
)
1243 has_short_buffer
= true;
1245 if (flag_stack_protect
== 2)
1247 if ((bits
& (SPCT_HAS_SMALL_CHAR_ARRAY
| SPCT_HAS_LARGE_CHAR_ARRAY
))
1248 && !(bits
& SPCT_HAS_AGGREGATE
))
1250 else if (bits
& SPCT_HAS_ARRAY
)
1254 ret
= (bits
& SPCT_HAS_LARGE_CHAR_ARRAY
) != 0;
1257 has_protected_decls
= true;
1262 /* Two helper routines that check for phase 1 and phase 2. These are used
1263 as callbacks for expand_stack_vars. */
1266 stack_protect_decl_phase_1 (tree decl
)
1268 return stack_protect_decl_phase (decl
) == 1;
1272 stack_protect_decl_phase_2 (tree decl
)
1274 return stack_protect_decl_phase (decl
) == 2;
1277 /* Ensure that variables in different stack protection phases conflict
1278 so that they are not merged and share the same stack slot. */
1281 add_stack_protection_conflicts (void)
1283 size_t i
, j
, n
= stack_vars_num
;
1284 unsigned char *phase
;
1286 phase
= XNEWVEC (unsigned char, n
);
1287 for (i
= 0; i
< n
; ++i
)
1288 phase
[i
] = stack_protect_decl_phase (stack_vars
[i
].decl
);
1290 for (i
= 0; i
< n
; ++i
)
1292 unsigned char ph_i
= phase
[i
];
1293 for (j
= 0; j
< i
; ++j
)
1294 if (ph_i
!= phase
[j
])
1295 add_stack_var_conflict (i
, j
);
1301 /* Create a decl for the guard at the top of the stack frame. */
1304 create_stack_guard (void)
1306 tree guard
= build_decl (DECL_SOURCE_LOCATION (current_function_decl
),
1307 VAR_DECL
, NULL
, ptr_type_node
);
1308 TREE_THIS_VOLATILE (guard
) = 1;
1309 TREE_USED (guard
) = 1;
1310 expand_one_stack_var (guard
);
1311 crtl
->stack_protect_guard
= guard
;
1314 /* A subroutine of expand_used_vars. Walk down through the BLOCK tree
1315 expanding variables. Those variables that can be put into registers
1316 are allocated pseudos; those that can't are put on the stack.
1318 TOPLEVEL is true if this is the outermost BLOCK. */
1320 static HOST_WIDE_INT
1321 account_used_vars_for_block (tree block
, bool toplevel
)
1324 HOST_WIDE_INT size
= 0;
1326 /* Expand all variables at this level. */
1327 for (t
= BLOCK_VARS (block
); t
; t
= DECL_CHAIN (t
))
1328 if (var_ann (t
) && is_used_p (t
))
1329 size
+= expand_one_var (t
, toplevel
, false);
1331 /* Expand all variables at containing levels. */
1332 for (t
= BLOCK_SUBBLOCKS (block
); t
; t
= BLOCK_CHAIN (t
))
1333 size
+= account_used_vars_for_block (t
, false);
1338 /* Prepare for expanding variables. */
1340 init_vars_expansion (void)
1344 /* Set TREE_USED on all variables in the local_decls. */
1345 FOR_EACH_LOCAL_DECL (cfun
, ix
, t
)
1348 /* Clear TREE_USED on all variables associated with a block scope. */
1349 clear_tree_used (DECL_INITIAL (current_function_decl
));
1351 /* Initialize local stack smashing state. */
1352 has_protected_decls
= false;
1353 has_short_buffer
= false;
1356 /* Free up stack variable graph data. */
1358 fini_vars_expansion (void)
1360 size_t i
, n
= stack_vars_num
;
1361 for (i
= 0; i
< n
; i
++)
1362 BITMAP_FREE (stack_vars
[i
].conflicts
);
1363 XDELETEVEC (stack_vars
);
1364 XDELETEVEC (stack_vars_sorted
);
1366 stack_vars_alloc
= stack_vars_num
= 0;
1369 /* Make a fair guess for the size of the stack frame of the decl
1370 passed. This doesn't have to be exact, the result is only used
1371 in the inline heuristics. So we don't want to run the full stack
1372 var packing algorithm (which is quadratic in the number of stack
1373 vars). Instead, we calculate the total size of all stack vars.
1374 This turns out to be a pretty fair estimate -- packing of stack
1375 vars doesn't happen very often. */
1378 estimated_stack_frame_size (tree decl
)
1380 HOST_WIDE_INT size
= 0;
1382 tree var
, outer_block
= DECL_INITIAL (current_function_decl
);
1384 tree old_cur_fun_decl
= current_function_decl
;
1385 current_function_decl
= decl
;
1386 push_cfun (DECL_STRUCT_FUNCTION (decl
));
1388 init_vars_expansion ();
1390 FOR_EACH_LOCAL_DECL (cfun
, ix
, var
)
1392 /* TREE_USED marks local variables that do not appear in lexical
1393 blocks. We don't want to expand those that do twice. */
1394 if (TREE_USED (var
))
1395 size
+= expand_one_var (var
, true, false);
1397 size
+= account_used_vars_for_block (outer_block
, true);
1399 if (stack_vars_num
> 0)
1401 /* Fake sorting the stack vars for account_stack_vars (). */
1402 stack_vars_sorted
= XNEWVEC (size_t, stack_vars_num
);
1403 for (i
= 0; i
< stack_vars_num
; ++i
)
1404 stack_vars_sorted
[i
] = i
;
1405 size
+= account_stack_vars ();
1406 fini_vars_expansion ();
1409 current_function_decl
= old_cur_fun_decl
;
1413 /* Expand all variables used in the function. */
1416 expand_used_vars (void)
1418 tree var
, outer_block
= DECL_INITIAL (current_function_decl
);
1419 VEC(tree
,heap
) *maybe_local_decls
= NULL
;
1423 /* Compute the phase of the stack frame for this function. */
1425 int align
= PREFERRED_STACK_BOUNDARY
/ BITS_PER_UNIT
;
1426 int off
= STARTING_FRAME_OFFSET
% align
;
1427 frame_phase
= off
? align
- off
: 0;
1430 init_vars_expansion ();
1432 for (i
= 0; i
< SA
.map
->num_partitions
; i
++)
1434 tree var
= partition_to_var (SA
.map
, i
);
1436 gcc_assert (is_gimple_reg (var
));
1437 if (TREE_CODE (SSA_NAME_VAR (var
)) == VAR_DECL
)
1438 expand_one_var (var
, true, true);
1441 /* This is a PARM_DECL or RESULT_DECL. For those partitions that
1442 contain the default def (representing the parm or result itself)
1443 we don't do anything here. But those which don't contain the
1444 default def (representing a temporary based on the parm/result)
1445 we need to allocate space just like for normal VAR_DECLs. */
1446 if (!bitmap_bit_p (SA
.partition_has_default_def
, i
))
1448 expand_one_var (var
, true, true);
1449 gcc_assert (SA
.partition_to_pseudo
[i
]);
1454 /* At this point all variables on the local_decls with TREE_USED
1455 set are not associated with any block scope. Lay them out. */
1457 len
= VEC_length (tree
, cfun
->local_decls
);
1458 FOR_EACH_LOCAL_DECL (cfun
, i
, var
)
1460 bool expand_now
= false;
1462 /* Expanded above already. */
1463 if (is_gimple_reg (var
))
1465 TREE_USED (var
) = 0;
1468 /* We didn't set a block for static or extern because it's hard
1469 to tell the difference between a global variable (re)declared
1470 in a local scope, and one that's really declared there to
1471 begin with. And it doesn't really matter much, since we're
1472 not giving them stack space. Expand them now. */
1473 else if (TREE_STATIC (var
) || DECL_EXTERNAL (var
))
1476 /* If the variable is not associated with any block, then it
1477 was created by the optimizers, and could be live anywhere
1479 else if (TREE_USED (var
))
1482 /* Finally, mark all variables on the list as used. We'll use
1483 this in a moment when we expand those associated with scopes. */
1484 TREE_USED (var
) = 1;
1487 expand_one_var (var
, true, true);
1490 if (DECL_ARTIFICIAL (var
) && !DECL_IGNORED_P (var
))
1492 rtx rtl
= DECL_RTL_IF_SET (var
);
1494 /* Keep artificial non-ignored vars in cfun->local_decls
1495 chain until instantiate_decls. */
1496 if (rtl
&& (MEM_P (rtl
) || GET_CODE (rtl
) == CONCAT
))
1497 add_local_decl (cfun
, var
);
1498 else if (rtl
== NULL_RTX
)
1499 /* If rtl isn't set yet, which can happen e.g. with
1500 -fstack-protector, retry before returning from this
1502 VEC_safe_push (tree
, heap
, maybe_local_decls
, var
);
1506 /* We duplicated some of the decls in CFUN->LOCAL_DECLS.
1508 +-----------------+-----------------+
1509 | ...processed... | ...duplicates...|
1510 +-----------------+-----------------+
1512 +-- LEN points here.
1514 We just want the duplicates, as those are the artificial
1515 non-ignored vars that we want to keep until instantiate_decls.
1516 Move them down and truncate the array. */
1517 if (!VEC_empty (tree
, cfun
->local_decls
))
1518 VEC_block_remove (tree
, cfun
->local_decls
, 0, len
);
1520 /* At this point, all variables within the block tree with TREE_USED
1521 set are actually used by the optimized function. Lay them out. */
1522 expand_used_vars_for_block (outer_block
, true);
1524 if (stack_vars_num
> 0)
1526 /* Due to the way alias sets work, no variables with non-conflicting
1527 alias sets may be assigned the same address. Add conflicts to
1529 add_alias_set_conflicts ();
1531 /* If stack protection is enabled, we don't share space between
1532 vulnerable data and non-vulnerable data. */
1533 if (flag_stack_protect
)
1534 add_stack_protection_conflicts ();
1536 /* Now that we have collected all stack variables, and have computed a
1537 minimal interference graph, attempt to save some stack space. */
1538 partition_stack_vars ();
1540 dump_stack_var_partition ();
1543 /* There are several conditions under which we should create a
1544 stack guard: protect-all, alloca used, protected decls present. */
1545 if (flag_stack_protect
== 2
1546 || (flag_stack_protect
1547 && (cfun
->calls_alloca
|| has_protected_decls
)))
1548 create_stack_guard ();
1550 /* Assign rtl to each variable based on these partitions. */
1551 if (stack_vars_num
> 0)
1553 /* Reorder decls to be protected by iterating over the variables
1554 array multiple times, and allocating out of each phase in turn. */
1555 /* ??? We could probably integrate this into the qsort we did
1556 earlier, such that we naturally see these variables first,
1557 and thus naturally allocate things in the right order. */
1558 if (has_protected_decls
)
1560 /* Phase 1 contains only character arrays. */
1561 expand_stack_vars (stack_protect_decl_phase_1
);
1563 /* Phase 2 contains other kinds of arrays. */
1564 if (flag_stack_protect
== 2)
1565 expand_stack_vars (stack_protect_decl_phase_2
);
1568 expand_stack_vars (NULL
);
1570 fini_vars_expansion ();
1573 /* If there were any artificial non-ignored vars without rtl
1574 found earlier, see if deferred stack allocation hasn't assigned
1576 FOR_EACH_VEC_ELT_REVERSE (tree
, maybe_local_decls
, i
, var
)
1578 rtx rtl
= DECL_RTL_IF_SET (var
);
1580 /* Keep artificial non-ignored vars in cfun->local_decls
1581 chain until instantiate_decls. */
1582 if (rtl
&& (MEM_P (rtl
) || GET_CODE (rtl
) == CONCAT
))
1583 add_local_decl (cfun
, var
);
1585 VEC_free (tree
, heap
, maybe_local_decls
);
1587 /* If the target requires that FRAME_OFFSET be aligned, do it. */
1588 if (STACK_ALIGNMENT_NEEDED
)
1590 HOST_WIDE_INT align
= PREFERRED_STACK_BOUNDARY
/ BITS_PER_UNIT
;
1591 if (!FRAME_GROWS_DOWNWARD
)
1592 frame_offset
+= align
- 1;
1593 frame_offset
&= -align
;
1598 /* If we need to produce a detailed dump, print the tree representation
1599 for STMT to the dump file. SINCE is the last RTX after which the RTL
1600 generated for STMT should have been appended. */
1603 maybe_dump_rtl_for_gimple_stmt (gimple stmt
, rtx since
)
1605 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
1607 fprintf (dump_file
, "\n;; ");
1608 print_gimple_stmt (dump_file
, stmt
, 0,
1609 TDF_SLIM
| (dump_flags
& TDF_LINENO
));
1610 fprintf (dump_file
, "\n");
1612 print_rtl (dump_file
, since
? NEXT_INSN (since
) : since
);
1616 /* Maps the blocks that do not contain tree labels to rtx labels. */
1618 static struct pointer_map_t
*lab_rtx_for_bb
;
1620 /* Returns the label_rtx expression for a label starting basic block BB. */
1623 label_rtx_for_bb (basic_block bb ATTRIBUTE_UNUSED
)
1625 gimple_stmt_iterator gsi
;
1630 if (bb
->flags
& BB_RTL
)
1631 return block_label (bb
);
1633 elt
= pointer_map_contains (lab_rtx_for_bb
, bb
);
1637 /* Find the tree label if it is present. */
1639 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
1641 lab_stmt
= gsi_stmt (gsi
);
1642 if (gimple_code (lab_stmt
) != GIMPLE_LABEL
)
1645 lab
= gimple_label_label (lab_stmt
);
1646 if (DECL_NONLOCAL (lab
))
1649 return label_rtx (lab
);
1652 elt
= pointer_map_insert (lab_rtx_for_bb
, bb
);
1653 *elt
= gen_label_rtx ();
1658 /* A subroutine of expand_gimple_cond. Given E, a fallthrough edge
1659 of a basic block where we just expanded the conditional at the end,
1660 possibly clean up the CFG and instruction sequence. LAST is the
1661 last instruction before the just emitted jump sequence. */
1664 maybe_cleanup_end_of_block (edge e
, rtx last
)
1666 /* Special case: when jumpif decides that the condition is
1667 trivial it emits an unconditional jump (and the necessary
1668 barrier). But we still have two edges, the fallthru one is
1669 wrong. purge_dead_edges would clean this up later. Unfortunately
1670 we have to insert insns (and split edges) before
1671 find_many_sub_basic_blocks and hence before purge_dead_edges.
1672 But splitting edges might create new blocks which depend on the
1673 fact that if there are two edges there's no barrier. So the
1674 barrier would get lost and verify_flow_info would ICE. Instead
1675 of auditing all edge splitters to care for the barrier (which
1676 normally isn't there in a cleaned CFG), fix it here. */
1677 if (BARRIER_P (get_last_insn ()))
1681 /* Now, we have a single successor block, if we have insns to
1682 insert on the remaining edge we potentially will insert
1683 it at the end of this block (if the dest block isn't feasible)
1684 in order to avoid splitting the edge. This insertion will take
1685 place in front of the last jump. But we might have emitted
1686 multiple jumps (conditional and one unconditional) to the
1687 same destination. Inserting in front of the last one then
1688 is a problem. See PR 40021. We fix this by deleting all
1689 jumps except the last unconditional one. */
1690 insn
= PREV_INSN (get_last_insn ());
1691 /* Make sure we have an unconditional jump. Otherwise we're
1693 gcc_assert (JUMP_P (insn
) && !any_condjump_p (insn
));
1694 for (insn
= PREV_INSN (insn
); insn
!= last
;)
1696 insn
= PREV_INSN (insn
);
1697 if (JUMP_P (NEXT_INSN (insn
)))
1699 if (!any_condjump_p (NEXT_INSN (insn
)))
1701 gcc_assert (BARRIER_P (NEXT_INSN (NEXT_INSN (insn
))));
1702 delete_insn (NEXT_INSN (NEXT_INSN (insn
)));
1704 delete_insn (NEXT_INSN (insn
));
1710 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_COND.
1711 Returns a new basic block if we've terminated the current basic
1712 block and created a new one. */
1715 expand_gimple_cond (basic_block bb
, gimple stmt
)
1717 basic_block new_bb
, dest
;
1722 enum tree_code code
;
1725 code
= gimple_cond_code (stmt
);
1726 op0
= gimple_cond_lhs (stmt
);
1727 op1
= gimple_cond_rhs (stmt
);
1728 /* We're sometimes presented with such code:
1732 This would expand to two comparisons which then later might
1733 be cleaned up by combine. But some pattern matchers like if-conversion
1734 work better when there's only one compare, so make up for this
1735 here as special exception if TER would have made the same change. */
1736 if (gimple_cond_single_var_p (stmt
)
1738 && TREE_CODE (op0
) == SSA_NAME
1739 && bitmap_bit_p (SA
.values
, SSA_NAME_VERSION (op0
)))
1741 gimple second
= SSA_NAME_DEF_STMT (op0
);
1742 if (gimple_code (second
) == GIMPLE_ASSIGN
)
1744 enum tree_code code2
= gimple_assign_rhs_code (second
);
1745 if (TREE_CODE_CLASS (code2
) == tcc_comparison
)
1748 op0
= gimple_assign_rhs1 (second
);
1749 op1
= gimple_assign_rhs2 (second
);
1751 /* If jumps are cheap turn some more codes into
1753 else if (BRANCH_COST (optimize_insn_for_speed_p (), false) < 4)
1755 if ((code2
== BIT_AND_EXPR
1756 && TYPE_PRECISION (TREE_TYPE (op0
)) == 1
1757 && TREE_CODE (gimple_assign_rhs2 (second
)) != INTEGER_CST
)
1758 || code2
== TRUTH_AND_EXPR
)
1760 code
= TRUTH_ANDIF_EXPR
;
1761 op0
= gimple_assign_rhs1 (second
);
1762 op1
= gimple_assign_rhs2 (second
);
1764 else if (code2
== BIT_IOR_EXPR
|| code2
== TRUTH_OR_EXPR
)
1766 code
= TRUTH_ORIF_EXPR
;
1767 op0
= gimple_assign_rhs1 (second
);
1768 op1
= gimple_assign_rhs2 (second
);
1774 last2
= last
= get_last_insn ();
1776 extract_true_false_edges_from_block (bb
, &true_edge
, &false_edge
);
1777 if (gimple_has_location (stmt
))
1779 set_curr_insn_source_location (gimple_location (stmt
));
1780 set_curr_insn_block (gimple_block (stmt
));
1783 /* These flags have no purpose in RTL land. */
1784 true_edge
->flags
&= ~EDGE_TRUE_VALUE
;
1785 false_edge
->flags
&= ~EDGE_FALSE_VALUE
;
1787 /* We can either have a pure conditional jump with one fallthru edge or
1788 two-way jump that needs to be decomposed into two basic blocks. */
1789 if (false_edge
->dest
== bb
->next_bb
)
1791 jumpif_1 (code
, op0
, op1
, label_rtx_for_bb (true_edge
->dest
),
1792 true_edge
->probability
);
1793 maybe_dump_rtl_for_gimple_stmt (stmt
, last
);
1794 if (true_edge
->goto_locus
)
1796 set_curr_insn_source_location (true_edge
->goto_locus
);
1797 set_curr_insn_block (true_edge
->goto_block
);
1798 true_edge
->goto_locus
= curr_insn_locator ();
1800 true_edge
->goto_block
= NULL
;
1801 false_edge
->flags
|= EDGE_FALLTHRU
;
1802 maybe_cleanup_end_of_block (false_edge
, last
);
1805 if (true_edge
->dest
== bb
->next_bb
)
1807 jumpifnot_1 (code
, op0
, op1
, label_rtx_for_bb (false_edge
->dest
),
1808 false_edge
->probability
);
1809 maybe_dump_rtl_for_gimple_stmt (stmt
, last
);
1810 if (false_edge
->goto_locus
)
1812 set_curr_insn_source_location (false_edge
->goto_locus
);
1813 set_curr_insn_block (false_edge
->goto_block
);
1814 false_edge
->goto_locus
= curr_insn_locator ();
1816 false_edge
->goto_block
= NULL
;
1817 true_edge
->flags
|= EDGE_FALLTHRU
;
1818 maybe_cleanup_end_of_block (true_edge
, last
);
1822 jumpif_1 (code
, op0
, op1
, label_rtx_for_bb (true_edge
->dest
),
1823 true_edge
->probability
);
1824 last
= get_last_insn ();
1825 if (false_edge
->goto_locus
)
1827 set_curr_insn_source_location (false_edge
->goto_locus
);
1828 set_curr_insn_block (false_edge
->goto_block
);
1829 false_edge
->goto_locus
= curr_insn_locator ();
1831 false_edge
->goto_block
= NULL
;
1832 emit_jump (label_rtx_for_bb (false_edge
->dest
));
1835 if (BARRIER_P (BB_END (bb
)))
1836 BB_END (bb
) = PREV_INSN (BB_END (bb
));
1837 update_bb_for_insn (bb
);
1839 new_bb
= create_basic_block (NEXT_INSN (last
), get_last_insn (), bb
);
1840 dest
= false_edge
->dest
;
1841 redirect_edge_succ (false_edge
, new_bb
);
1842 false_edge
->flags
|= EDGE_FALLTHRU
;
1843 new_bb
->count
= false_edge
->count
;
1844 new_bb
->frequency
= EDGE_FREQUENCY (false_edge
);
1845 new_edge
= make_edge (new_bb
, dest
, 0);
1846 new_edge
->probability
= REG_BR_PROB_BASE
;
1847 new_edge
->count
= new_bb
->count
;
1848 if (BARRIER_P (BB_END (new_bb
)))
1849 BB_END (new_bb
) = PREV_INSN (BB_END (new_bb
));
1850 update_bb_for_insn (new_bb
);
1852 maybe_dump_rtl_for_gimple_stmt (stmt
, last2
);
1854 if (true_edge
->goto_locus
)
1856 set_curr_insn_source_location (true_edge
->goto_locus
);
1857 set_curr_insn_block (true_edge
->goto_block
);
1858 true_edge
->goto_locus
= curr_insn_locator ();
1860 true_edge
->goto_block
= NULL
;
1865 /* A subroutine of expand_gimple_stmt_1, expanding one GIMPLE_CALL
1869 expand_call_stmt (gimple stmt
)
1872 tree lhs
= gimple_call_lhs (stmt
);
1877 exp
= build_vl_exp (CALL_EXPR
, gimple_call_num_args (stmt
) + 3);
1879 CALL_EXPR_FN (exp
) = gimple_call_fn (stmt
);
1880 decl
= gimple_call_fndecl (stmt
);
1881 builtin_p
= decl
&& DECL_BUILT_IN (decl
);
1883 TREE_TYPE (exp
) = gimple_call_return_type (stmt
);
1884 CALL_EXPR_STATIC_CHAIN (exp
) = gimple_call_chain (stmt
);
1886 for (i
= 0; i
< gimple_call_num_args (stmt
); i
++)
1888 tree arg
= gimple_call_arg (stmt
, i
);
1890 /* TER addresses into arguments of builtin functions so we have a
1891 chance to infer more correct alignment information. See PR39954. */
1893 && TREE_CODE (arg
) == SSA_NAME
1894 && (def
= get_gimple_for_ssa_name (arg
))
1895 && gimple_assign_rhs_code (def
) == ADDR_EXPR
)
1896 arg
= gimple_assign_rhs1 (def
);
1897 CALL_EXPR_ARG (exp
, i
) = arg
;
1900 if (gimple_has_side_effects (stmt
))
1901 TREE_SIDE_EFFECTS (exp
) = 1;
1903 if (gimple_call_nothrow_p (stmt
))
1904 TREE_NOTHROW (exp
) = 1;
1906 CALL_EXPR_TAILCALL (exp
) = gimple_call_tail_p (stmt
);
1907 CALL_EXPR_RETURN_SLOT_OPT (exp
) = gimple_call_return_slot_opt_p (stmt
);
1908 CALL_FROM_THUNK_P (exp
) = gimple_call_from_thunk_p (stmt
);
1909 CALL_CANNOT_INLINE_P (exp
) = gimple_call_cannot_inline_p (stmt
);
1910 CALL_EXPR_VA_ARG_PACK (exp
) = gimple_call_va_arg_pack_p (stmt
);
1911 SET_EXPR_LOCATION (exp
, gimple_location (stmt
));
1912 TREE_BLOCK (exp
) = gimple_block (stmt
);
1915 expand_assignment (lhs
, exp
, false);
1917 expand_expr_real_1 (exp
, const0_rtx
, VOIDmode
, EXPAND_NORMAL
, NULL
);
1920 /* A subroutine of expand_gimple_stmt, expanding one gimple statement
1921 STMT that doesn't require special handling for outgoing edges. That
1922 is no tailcalls and no GIMPLE_COND. */
1925 expand_gimple_stmt_1 (gimple stmt
)
1928 switch (gimple_code (stmt
))
1931 op0
= gimple_goto_dest (stmt
);
1932 if (TREE_CODE (op0
) == LABEL_DECL
)
1935 expand_computed_goto (op0
);
1938 expand_label (gimple_label_label (stmt
));
1941 case GIMPLE_PREDICT
:
1947 expand_asm_stmt (stmt
);
1950 expand_call_stmt (stmt
);
1954 op0
= gimple_return_retval (stmt
);
1956 if (op0
&& op0
!= error_mark_node
)
1958 tree result
= DECL_RESULT (current_function_decl
);
1960 /* If we are not returning the current function's RESULT_DECL,
1961 build an assignment to it. */
1964 /* I believe that a function's RESULT_DECL is unique. */
1965 gcc_assert (TREE_CODE (op0
) != RESULT_DECL
);
1967 /* ??? We'd like to use simply expand_assignment here,
1968 but this fails if the value is of BLKmode but the return
1969 decl is a register. expand_return has special handling
1970 for this combination, which eventually should move
1971 to common code. See comments there. Until then, let's
1972 build a modify expression :-/ */
1973 op0
= build2 (MODIFY_EXPR
, TREE_TYPE (result
),
1978 expand_null_return ();
1980 expand_return (op0
);
1985 tree lhs
= gimple_assign_lhs (stmt
);
1987 /* Tree expand used to fiddle with |= and &= of two bitfield
1988 COMPONENT_REFs here. This can't happen with gimple, the LHS
1989 of binary assigns must be a gimple reg. */
1991 if (TREE_CODE (lhs
) != SSA_NAME
1992 || get_gimple_rhs_class (gimple_expr_code (stmt
))
1993 == GIMPLE_SINGLE_RHS
)
1995 tree rhs
= gimple_assign_rhs1 (stmt
);
1996 gcc_assert (get_gimple_rhs_class (gimple_expr_code (stmt
))
1997 == GIMPLE_SINGLE_RHS
);
1998 if (gimple_has_location (stmt
) && CAN_HAVE_LOCATION_P (rhs
))
1999 SET_EXPR_LOCATION (rhs
, gimple_location (stmt
));
2000 expand_assignment (lhs
, rhs
,
2001 gimple_assign_nontemporal_move_p (stmt
));
2006 bool nontemporal
= gimple_assign_nontemporal_move_p (stmt
);
2007 struct separate_ops ops
;
2008 bool promoted
= false;
2010 target
= expand_expr (lhs
, NULL_RTX
, VOIDmode
, EXPAND_WRITE
);
2011 if (GET_CODE (target
) == SUBREG
&& SUBREG_PROMOTED_VAR_P (target
))
2014 ops
.code
= gimple_assign_rhs_code (stmt
);
2015 ops
.type
= TREE_TYPE (lhs
);
2016 switch (get_gimple_rhs_class (gimple_expr_code (stmt
)))
2018 case GIMPLE_TERNARY_RHS
:
2019 ops
.op2
= gimple_assign_rhs3 (stmt
);
2021 case GIMPLE_BINARY_RHS
:
2022 ops
.op1
= gimple_assign_rhs2 (stmt
);
2024 case GIMPLE_UNARY_RHS
:
2025 ops
.op0
= gimple_assign_rhs1 (stmt
);
2030 ops
.location
= gimple_location (stmt
);
2032 /* If we want to use a nontemporal store, force the value to
2033 register first. If we store into a promoted register,
2034 don't directly expand to target. */
2035 temp
= nontemporal
|| promoted
? NULL_RTX
: target
;
2036 temp
= expand_expr_real_2 (&ops
, temp
, GET_MODE (target
),
2043 int unsignedp
= SUBREG_PROMOTED_UNSIGNED_P (target
);
2044 /* If TEMP is a VOIDmode constant, use convert_modes to make
2045 sure that we properly convert it. */
2046 if (CONSTANT_P (temp
) && GET_MODE (temp
) == VOIDmode
)
2048 temp
= convert_modes (GET_MODE (target
),
2049 TYPE_MODE (ops
.type
),
2051 temp
= convert_modes (GET_MODE (SUBREG_REG (target
)),
2052 GET_MODE (target
), temp
, unsignedp
);
2055 convert_move (SUBREG_REG (target
), temp
, unsignedp
);
2057 else if (nontemporal
&& emit_storent_insn (target
, temp
))
2061 temp
= force_operand (temp
, target
);
2063 emit_move_insn (target
, temp
);
2074 /* Expand one gimple statement STMT and return the last RTL instruction
2075 before any of the newly generated ones.
2077 In addition to generating the necessary RTL instructions this also
2078 sets REG_EH_REGION notes if necessary and sets the current source
2079 location for diagnostics. */
2082 expand_gimple_stmt (gimple stmt
)
2086 location_t saved_location
= input_location
;
2088 last
= get_last_insn ();
2090 /* If this is an expression of some kind and it has an associated line
2091 number, then emit the line number before expanding the expression.
2093 We need to save and restore the file and line information so that
2094 errors discovered during expansion are emitted with the right
2095 information. It would be better of the diagnostic routines
2096 used the file/line information embedded in the tree nodes rather
2100 if (gimple_has_location (stmt
))
2102 input_location
= gimple_location (stmt
);
2103 set_curr_insn_source_location (input_location
);
2105 /* Record where the insns produced belong. */
2106 set_curr_insn_block (gimple_block (stmt
));
2109 expand_gimple_stmt_1 (stmt
);
2110 /* Free any temporaries used to evaluate this statement. */
2113 input_location
= saved_location
;
2115 /* Mark all insns that may trap. */
2116 lp_nr
= lookup_stmt_eh_lp (stmt
);
2120 for (insn
= next_real_insn (last
); insn
;
2121 insn
= next_real_insn (insn
))
2123 if (! find_reg_note (insn
, REG_EH_REGION
, NULL_RTX
)
2124 /* If we want exceptions for non-call insns, any
2125 may_trap_p instruction may throw. */
2126 && GET_CODE (PATTERN (insn
)) != CLOBBER
2127 && GET_CODE (PATTERN (insn
)) != USE
2128 && insn_could_throw_p (insn
))
2129 make_reg_eh_region_note (insn
, 0, lp_nr
);
2136 /* A subroutine of expand_gimple_basic_block. Expand one GIMPLE_CALL
2137 that has CALL_EXPR_TAILCALL set. Returns non-null if we actually
2138 generated a tail call (something that might be denied by the ABI
2139 rules governing the call; see calls.c).
2141 Sets CAN_FALLTHRU if we generated a *conditional* tail call, and
2142 can still reach the rest of BB. The case here is __builtin_sqrt,
2143 where the NaN result goes through the external function (with a
2144 tailcall) and the normal result happens via a sqrt instruction. */
2147 expand_gimple_tailcall (basic_block bb
, gimple stmt
, bool *can_fallthru
)
2155 last2
= last
= expand_gimple_stmt (stmt
);
2157 for (last
= NEXT_INSN (last
); last
; last
= NEXT_INSN (last
))
2158 if (CALL_P (last
) && SIBLING_CALL_P (last
))
2161 maybe_dump_rtl_for_gimple_stmt (stmt
, last2
);
2163 *can_fallthru
= true;
2167 /* ??? Wouldn't it be better to just reset any pending stack adjust?
2168 Any instructions emitted here are about to be deleted. */
2169 do_pending_stack_adjust ();
2171 /* Remove any non-eh, non-abnormal edges that don't go to exit. */
2172 /* ??? I.e. the fallthrough edge. HOWEVER! If there were to be
2173 EH or abnormal edges, we shouldn't have created a tail call in
2174 the first place. So it seems to me we should just be removing
2175 all edges here, or redirecting the existing fallthru edge to
2181 for (ei
= ei_start (bb
->succs
); (e
= ei_safe_edge (ei
)); )
2183 if (!(e
->flags
& (EDGE_ABNORMAL
| EDGE_EH
)))
2185 if (e
->dest
!= EXIT_BLOCK_PTR
)
2187 e
->dest
->count
-= e
->count
;
2188 e
->dest
->frequency
-= EDGE_FREQUENCY (e
);
2189 if (e
->dest
->count
< 0)
2191 if (e
->dest
->frequency
< 0)
2192 e
->dest
->frequency
= 0;
2195 probability
+= e
->probability
;
2202 /* This is somewhat ugly: the call_expr expander often emits instructions
2203 after the sibcall (to perform the function return). These confuse the
2204 find_many_sub_basic_blocks code, so we need to get rid of these. */
2205 last
= NEXT_INSN (last
);
2206 gcc_assert (BARRIER_P (last
));
2208 *can_fallthru
= false;
2209 while (NEXT_INSN (last
))
2211 /* For instance an sqrt builtin expander expands if with
2212 sibcall in the then and label for `else`. */
2213 if (LABEL_P (NEXT_INSN (last
)))
2215 *can_fallthru
= true;
2218 delete_insn (NEXT_INSN (last
));
2221 e
= make_edge (bb
, EXIT_BLOCK_PTR
, EDGE_ABNORMAL
| EDGE_SIBCALL
);
2222 e
->probability
+= probability
;
2225 update_bb_for_insn (bb
);
2227 if (NEXT_INSN (last
))
2229 bb
= create_basic_block (NEXT_INSN (last
), get_last_insn (), bb
);
2232 if (BARRIER_P (last
))
2233 BB_END (bb
) = PREV_INSN (last
);
2236 maybe_dump_rtl_for_gimple_stmt (stmt
, last2
);
2241 /* Return the difference between the floor and the truncated result of
2242 a signed division by OP1 with remainder MOD. */
2244 floor_sdiv_adjust (enum machine_mode mode
, rtx mod
, rtx op1
)
2246 /* (mod != 0 ? (op1 / mod < 0 ? -1 : 0) : 0) */
2247 return gen_rtx_IF_THEN_ELSE
2248 (mode
, gen_rtx_NE (BImode
, mod
, const0_rtx
),
2249 gen_rtx_IF_THEN_ELSE
2250 (mode
, gen_rtx_LT (BImode
,
2251 gen_rtx_DIV (mode
, op1
, mod
),
2253 constm1_rtx
, const0_rtx
),
2257 /* Return the difference between the ceil and the truncated result of
2258 a signed division by OP1 with remainder MOD. */
2260 ceil_sdiv_adjust (enum machine_mode mode
, rtx mod
, rtx op1
)
2262 /* (mod != 0 ? (op1 / mod > 0 ? 1 : 0) : 0) */
2263 return gen_rtx_IF_THEN_ELSE
2264 (mode
, gen_rtx_NE (BImode
, mod
, const0_rtx
),
2265 gen_rtx_IF_THEN_ELSE
2266 (mode
, gen_rtx_GT (BImode
,
2267 gen_rtx_DIV (mode
, op1
, mod
),
2269 const1_rtx
, const0_rtx
),
2273 /* Return the difference between the ceil and the truncated result of
2274 an unsigned division by OP1 with remainder MOD. */
2276 ceil_udiv_adjust (enum machine_mode mode
, rtx mod
, rtx op1 ATTRIBUTE_UNUSED
)
2278 /* (mod != 0 ? 1 : 0) */
2279 return gen_rtx_IF_THEN_ELSE
2280 (mode
, gen_rtx_NE (BImode
, mod
, const0_rtx
),
2281 const1_rtx
, const0_rtx
);
2284 /* Return the difference between the rounded and the truncated result
2285 of a signed division by OP1 with remainder MOD. Halfway cases are
2286 rounded away from zero, rather than to the nearest even number. */
2288 round_sdiv_adjust (enum machine_mode mode
, rtx mod
, rtx op1
)
2290 /* (abs (mod) >= abs (op1) - abs (mod)
2291 ? (op1 / mod > 0 ? 1 : -1)
2293 return gen_rtx_IF_THEN_ELSE
2294 (mode
, gen_rtx_GE (BImode
, gen_rtx_ABS (mode
, mod
),
2295 gen_rtx_MINUS (mode
,
2296 gen_rtx_ABS (mode
, op1
),
2297 gen_rtx_ABS (mode
, mod
))),
2298 gen_rtx_IF_THEN_ELSE
2299 (mode
, gen_rtx_GT (BImode
,
2300 gen_rtx_DIV (mode
, op1
, mod
),
2302 const1_rtx
, constm1_rtx
),
2306 /* Return the difference between the rounded and the truncated result
2307 of a unsigned division by OP1 with remainder MOD. Halfway cases
2308 are rounded away from zero, rather than to the nearest even
2311 round_udiv_adjust (enum machine_mode mode
, rtx mod
, rtx op1
)
2313 /* (mod >= op1 - mod ? 1 : 0) */
2314 return gen_rtx_IF_THEN_ELSE
2315 (mode
, gen_rtx_GE (BImode
, mod
,
2316 gen_rtx_MINUS (mode
, op1
, mod
)),
2317 const1_rtx
, const0_rtx
);
2320 /* Convert X to MODE, that must be Pmode or ptr_mode, without emitting
2324 convert_debug_memory_address (enum machine_mode mode
, rtx x
)
2326 enum machine_mode xmode
= GET_MODE (x
);
2328 #ifndef POINTERS_EXTEND_UNSIGNED
2329 gcc_assert (mode
== Pmode
);
2330 gcc_assert (xmode
== mode
|| xmode
== VOIDmode
);
2332 gcc_assert (mode
== Pmode
|| mode
== ptr_mode
);
2334 if (GET_MODE (x
) == mode
|| GET_MODE (x
) == VOIDmode
)
2337 if (GET_MODE_BITSIZE (mode
) < GET_MODE_BITSIZE (xmode
))
2338 x
= simplify_gen_subreg (mode
, x
, xmode
,
2339 subreg_lowpart_offset
2341 else if (POINTERS_EXTEND_UNSIGNED
> 0)
2342 x
= gen_rtx_ZERO_EXTEND (mode
, x
);
2343 else if (!POINTERS_EXTEND_UNSIGNED
)
2344 x
= gen_rtx_SIGN_EXTEND (mode
, x
);
2347 #endif /* POINTERS_EXTEND_UNSIGNED */
2352 /* Return an RTX equivalent to the value of the tree expression
2356 expand_debug_expr (tree exp
)
2358 rtx op0
= NULL_RTX
, op1
= NULL_RTX
, op2
= NULL_RTX
;
2359 enum machine_mode mode
= TYPE_MODE (TREE_TYPE (exp
));
2360 int unsignedp
= TYPE_UNSIGNED (TREE_TYPE (exp
));
2363 switch (TREE_CODE_CLASS (TREE_CODE (exp
)))
2365 case tcc_expression
:
2366 switch (TREE_CODE (exp
))
2370 case WIDEN_MULT_PLUS_EXPR
:
2371 case WIDEN_MULT_MINUS_EXPR
:
2375 case TRUTH_ANDIF_EXPR
:
2376 case TRUTH_ORIF_EXPR
:
2377 case TRUTH_AND_EXPR
:
2379 case TRUTH_XOR_EXPR
:
2382 case TRUTH_NOT_EXPR
:
2391 op2
= expand_debug_expr (TREE_OPERAND (exp
, 2));
2398 case tcc_comparison
:
2399 op1
= expand_debug_expr (TREE_OPERAND (exp
, 1));
2406 op0
= expand_debug_expr (TREE_OPERAND (exp
, 0));
2416 case tcc_exceptional
:
2417 case tcc_declaration
:
2423 switch (TREE_CODE (exp
))
2426 if (!lookup_constant_def (exp
))
2428 if (strlen (TREE_STRING_POINTER (exp
)) + 1
2429 != (size_t) TREE_STRING_LENGTH (exp
))
2431 op0
= gen_rtx_CONST_STRING (Pmode
, TREE_STRING_POINTER (exp
));
2432 op0
= gen_rtx_MEM (BLKmode
, op0
);
2433 set_mem_attributes (op0
, exp
, 0);
2436 /* Fall through... */
2441 op0
= expand_expr (exp
, NULL_RTX
, mode
, EXPAND_INITIALIZER
);
2445 gcc_assert (COMPLEX_MODE_P (mode
));
2446 op0
= expand_debug_expr (TREE_REALPART (exp
));
2447 op1
= expand_debug_expr (TREE_IMAGPART (exp
));
2448 return gen_rtx_CONCAT (mode
, op0
, op1
);
2450 case DEBUG_EXPR_DECL
:
2451 op0
= DECL_RTL_IF_SET (exp
);
2456 op0
= gen_rtx_DEBUG_EXPR (mode
);
2457 DEBUG_EXPR_TREE_DECL (op0
) = exp
;
2458 SET_DECL_RTL (exp
, op0
);
2468 op0
= DECL_RTL_IF_SET (exp
);
2470 /* This decl was probably optimized away. */
2473 if (TREE_CODE (exp
) != VAR_DECL
2474 || DECL_EXTERNAL (exp
)
2475 || !TREE_STATIC (exp
)
2477 || DECL_HARD_REGISTER (exp
)
2478 || mode
== VOIDmode
)
2481 op0
= make_decl_rtl_for_debug (exp
);
2483 || GET_CODE (XEXP (op0
, 0)) != SYMBOL_REF
2484 || SYMBOL_REF_DECL (XEXP (op0
, 0)) != exp
)
2488 op0
= copy_rtx (op0
);
2490 if (GET_MODE (op0
) == BLKmode
2491 /* If op0 is not BLKmode, but BLKmode is, adjust_mode
2492 below would ICE. While it is likely a FE bug,
2493 try to be robust here. See PR43166. */
2495 || (mode
== VOIDmode
&& GET_MODE (op0
) != VOIDmode
))
2497 gcc_assert (MEM_P (op0
));
2498 op0
= adjust_address_nv (op0
, mode
, 0);
2509 enum machine_mode inner_mode
= GET_MODE (op0
);
2511 if (mode
== inner_mode
)
2514 if (inner_mode
== VOIDmode
)
2516 if (TREE_CODE (exp
) == SSA_NAME
)
2517 inner_mode
= TYPE_MODE (TREE_TYPE (exp
));
2519 inner_mode
= TYPE_MODE (TREE_TYPE (TREE_OPERAND (exp
, 0)));
2520 if (mode
== inner_mode
)
2524 if (FLOAT_MODE_P (mode
) && FLOAT_MODE_P (inner_mode
))
2526 if (GET_MODE_BITSIZE (mode
) == GET_MODE_BITSIZE (inner_mode
))
2527 op0
= simplify_gen_subreg (mode
, op0
, inner_mode
, 0);
2528 else if (GET_MODE_BITSIZE (mode
) < GET_MODE_BITSIZE (inner_mode
))
2529 op0
= simplify_gen_unary (FLOAT_TRUNCATE
, mode
, op0
, inner_mode
);
2531 op0
= simplify_gen_unary (FLOAT_EXTEND
, mode
, op0
, inner_mode
);
2533 else if (FLOAT_MODE_P (mode
))
2535 gcc_assert (TREE_CODE (exp
) != SSA_NAME
);
2536 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 0))))
2537 op0
= simplify_gen_unary (UNSIGNED_FLOAT
, mode
, op0
, inner_mode
);
2539 op0
= simplify_gen_unary (FLOAT
, mode
, op0
, inner_mode
);
2541 else if (FLOAT_MODE_P (inner_mode
))
2544 op0
= simplify_gen_unary (UNSIGNED_FIX
, mode
, op0
, inner_mode
);
2546 op0
= simplify_gen_unary (FIX
, mode
, op0
, inner_mode
);
2548 else if (CONSTANT_P (op0
)
2549 || GET_MODE_BITSIZE (mode
) <= GET_MODE_BITSIZE (inner_mode
))
2550 op0
= simplify_gen_subreg (mode
, op0
, inner_mode
,
2551 subreg_lowpart_offset (mode
,
2553 else if (TREE_CODE_CLASS (TREE_CODE (exp
)) == tcc_unary
2554 ? TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 0)))
2556 op0
= gen_rtx_ZERO_EXTEND (mode
, op0
);
2558 op0
= gen_rtx_SIGN_EXTEND (mode
, op0
);
2565 op0
= expand_debug_expr (TREE_OPERAND (exp
, 0));
2569 if (TREE_CODE (exp
) == MEM_REF
)
2571 if (GET_CODE (op0
) == DEBUG_IMPLICIT_PTR
2572 || (GET_CODE (op0
) == PLUS
2573 && GET_CODE (XEXP (op0
, 0)) == DEBUG_IMPLICIT_PTR
))
2574 /* (mem (debug_implicit_ptr)) might confuse aliasing.
2575 Instead just use get_inner_reference. */
2578 op1
= expand_debug_expr (TREE_OPERAND (exp
, 1));
2579 if (!op1
|| !CONST_INT_P (op1
))
2582 op0
= plus_constant (op0
, INTVAL (op1
));
2585 if (POINTER_TYPE_P (TREE_TYPE (exp
)))
2586 as
= TYPE_ADDR_SPACE (TREE_TYPE (TREE_TYPE (exp
)));
2588 as
= ADDR_SPACE_GENERIC
;
2590 op0
= gen_rtx_MEM (mode
, op0
);
2592 set_mem_attributes (op0
, exp
, 0);
2593 set_mem_addr_space (op0
, as
);
2597 case TARGET_MEM_REF
:
2598 if (TREE_CODE (TMR_BASE (exp
)) == ADDR_EXPR
2599 && !DECL_RTL_SET_P (TREE_OPERAND (TMR_BASE (exp
), 0)))
2602 op0
= expand_debug_expr
2603 (tree_mem_ref_addr (build_pointer_type (TREE_TYPE (exp
)), exp
));
2607 as
= TYPE_ADDR_SPACE (TREE_TYPE (exp
));
2609 op0
= gen_rtx_MEM (mode
, op0
);
2611 set_mem_attributes (op0
, exp
, 0);
2612 set_mem_addr_space (op0
, as
);
2618 case ARRAY_RANGE_REF
:
2623 case VIEW_CONVERT_EXPR
:
2625 enum machine_mode mode1
;
2626 HOST_WIDE_INT bitsize
, bitpos
;
2629 tree tem
= get_inner_reference (exp
, &bitsize
, &bitpos
, &offset
,
2630 &mode1
, &unsignedp
, &volatilep
, false);
2636 orig_op0
= op0
= expand_debug_expr (tem
);
2643 enum machine_mode addrmode
, offmode
;
2648 op0
= XEXP (op0
, 0);
2649 addrmode
= GET_MODE (op0
);
2650 if (addrmode
== VOIDmode
)
2653 op1
= expand_debug_expr (offset
);
2657 offmode
= GET_MODE (op1
);
2658 if (offmode
== VOIDmode
)
2659 offmode
= TYPE_MODE (TREE_TYPE (offset
));
2661 if (addrmode
!= offmode
)
2662 op1
= simplify_gen_subreg (addrmode
, op1
, offmode
,
2663 subreg_lowpart_offset (addrmode
,
2666 /* Don't use offset_address here, we don't need a
2667 recognizable address, and we don't want to generate
2669 op0
= gen_rtx_MEM (mode
, gen_rtx_PLUS (addrmode
, op0
, op1
));
2674 if (mode1
== VOIDmode
)
2676 mode1
= smallest_mode_for_size (bitsize
, MODE_INT
);
2677 if (bitpos
>= BITS_PER_UNIT
)
2679 op0
= adjust_address_nv (op0
, mode1
, bitpos
/ BITS_PER_UNIT
);
2680 bitpos
%= BITS_PER_UNIT
;
2682 else if (bitpos
< 0)
2685 = (-bitpos
+ BITS_PER_UNIT
- 1) / BITS_PER_UNIT
;
2686 op0
= adjust_address_nv (op0
, mode1
, units
);
2687 bitpos
+= units
* BITS_PER_UNIT
;
2689 else if (bitpos
== 0 && bitsize
== GET_MODE_BITSIZE (mode
))
2690 op0
= adjust_address_nv (op0
, mode
, 0);
2691 else if (GET_MODE (op0
) != mode1
)
2692 op0
= adjust_address_nv (op0
, mode1
, 0);
2694 op0
= copy_rtx (op0
);
2695 if (op0
== orig_op0
)
2696 op0
= shallow_copy_rtx (op0
);
2697 set_mem_attributes (op0
, exp
, 0);
2700 if (bitpos
== 0 && mode
== GET_MODE (op0
))
2706 if (GET_MODE (op0
) == BLKmode
)
2709 if ((bitpos
% BITS_PER_UNIT
) == 0
2710 && bitsize
== GET_MODE_BITSIZE (mode1
))
2712 enum machine_mode opmode
= GET_MODE (op0
);
2714 if (opmode
== VOIDmode
)
2715 opmode
= TYPE_MODE (TREE_TYPE (tem
));
2717 /* This condition may hold if we're expanding the address
2718 right past the end of an array that turned out not to
2719 be addressable (i.e., the address was only computed in
2720 debug stmts). The gen_subreg below would rightfully
2721 crash, and the address doesn't really exist, so just
2723 if (bitpos
>= GET_MODE_BITSIZE (opmode
))
2726 if ((bitpos
% GET_MODE_BITSIZE (mode
)) == 0)
2727 return simplify_gen_subreg (mode
, op0
, opmode
,
2728 bitpos
/ BITS_PER_UNIT
);
2731 return simplify_gen_ternary (SCALAR_INT_MODE_P (GET_MODE (op0
))
2732 && TYPE_UNSIGNED (TREE_TYPE (exp
))
2734 : ZERO_EXTRACT
, mode
,
2735 GET_MODE (op0
) != VOIDmode
2737 : TYPE_MODE (TREE_TYPE (tem
)),
2738 op0
, GEN_INT (bitsize
), GEN_INT (bitpos
));
2742 return gen_rtx_ABS (mode
, op0
);
2745 return gen_rtx_NEG (mode
, op0
);
2748 return gen_rtx_NOT (mode
, op0
);
2752 return gen_rtx_UNSIGNED_FLOAT (mode
, op0
);
2754 return gen_rtx_FLOAT (mode
, op0
);
2756 case FIX_TRUNC_EXPR
:
2758 return gen_rtx_UNSIGNED_FIX (mode
, op0
);
2760 return gen_rtx_FIX (mode
, op0
);
2762 case POINTER_PLUS_EXPR
:
2763 /* For the rare target where pointers are not the same size as
2764 size_t, we need to check for mis-matched modes and correct
2767 && GET_MODE (op0
) != VOIDmode
&& GET_MODE (op1
) != VOIDmode
2768 && GET_MODE (op0
) != GET_MODE (op1
))
2770 if (GET_MODE_BITSIZE (GET_MODE (op0
)) < GET_MODE_BITSIZE (GET_MODE (op1
)))
2771 op1
= gen_rtx_TRUNCATE (GET_MODE (op0
), op1
);
2773 /* We always sign-extend, regardless of the signedness of
2774 the operand, because the operand is always unsigned
2775 here even if the original C expression is signed. */
2776 op1
= gen_rtx_SIGN_EXTEND (GET_MODE (op0
), op1
);
2780 return gen_rtx_PLUS (mode
, op0
, op1
);
2783 return gen_rtx_MINUS (mode
, op0
, op1
);
2786 return gen_rtx_MULT (mode
, op0
, op1
);
2789 case TRUNC_DIV_EXPR
:
2790 case EXACT_DIV_EXPR
:
2792 return gen_rtx_UDIV (mode
, op0
, op1
);
2794 return gen_rtx_DIV (mode
, op0
, op1
);
2796 case TRUNC_MOD_EXPR
:
2798 return gen_rtx_UMOD (mode
, op0
, op1
);
2800 return gen_rtx_MOD (mode
, op0
, op1
);
2802 case FLOOR_DIV_EXPR
:
2804 return gen_rtx_UDIV (mode
, op0
, op1
);
2807 rtx div
= gen_rtx_DIV (mode
, op0
, op1
);
2808 rtx mod
= gen_rtx_MOD (mode
, op0
, op1
);
2809 rtx adj
= floor_sdiv_adjust (mode
, mod
, op1
);
2810 return gen_rtx_PLUS (mode
, div
, adj
);
2813 case FLOOR_MOD_EXPR
:
2815 return gen_rtx_UMOD (mode
, op0
, op1
);
2818 rtx mod
= gen_rtx_MOD (mode
, op0
, op1
);
2819 rtx adj
= floor_sdiv_adjust (mode
, mod
, op1
);
2820 adj
= gen_rtx_NEG (mode
, gen_rtx_MULT (mode
, adj
, op1
));
2821 return gen_rtx_PLUS (mode
, mod
, adj
);
2827 rtx div
= gen_rtx_UDIV (mode
, op0
, op1
);
2828 rtx mod
= gen_rtx_UMOD (mode
, op0
, op1
);
2829 rtx adj
= ceil_udiv_adjust (mode
, mod
, op1
);
2830 return gen_rtx_PLUS (mode
, div
, adj
);
2834 rtx div
= gen_rtx_DIV (mode
, op0
, op1
);
2835 rtx mod
= gen_rtx_MOD (mode
, op0
, op1
);
2836 rtx adj
= ceil_sdiv_adjust (mode
, mod
, op1
);
2837 return gen_rtx_PLUS (mode
, div
, adj
);
2843 rtx mod
= gen_rtx_UMOD (mode
, op0
, op1
);
2844 rtx adj
= ceil_udiv_adjust (mode
, mod
, op1
);
2845 adj
= gen_rtx_NEG (mode
, gen_rtx_MULT (mode
, adj
, op1
));
2846 return gen_rtx_PLUS (mode
, mod
, adj
);
2850 rtx mod
= gen_rtx_MOD (mode
, op0
, op1
);
2851 rtx adj
= ceil_sdiv_adjust (mode
, mod
, op1
);
2852 adj
= gen_rtx_NEG (mode
, gen_rtx_MULT (mode
, adj
, op1
));
2853 return gen_rtx_PLUS (mode
, mod
, adj
);
2856 case ROUND_DIV_EXPR
:
2859 rtx div
= gen_rtx_UDIV (mode
, op0
, op1
);
2860 rtx mod
= gen_rtx_UMOD (mode
, op0
, op1
);
2861 rtx adj
= round_udiv_adjust (mode
, mod
, op1
);
2862 return gen_rtx_PLUS (mode
, div
, adj
);
2866 rtx div
= gen_rtx_DIV (mode
, op0
, op1
);
2867 rtx mod
= gen_rtx_MOD (mode
, op0
, op1
);
2868 rtx adj
= round_sdiv_adjust (mode
, mod
, op1
);
2869 return gen_rtx_PLUS (mode
, div
, adj
);
2872 case ROUND_MOD_EXPR
:
2875 rtx mod
= gen_rtx_UMOD (mode
, op0
, op1
);
2876 rtx adj
= round_udiv_adjust (mode
, mod
, op1
);
2877 adj
= gen_rtx_NEG (mode
, gen_rtx_MULT (mode
, adj
, op1
));
2878 return gen_rtx_PLUS (mode
, mod
, adj
);
2882 rtx mod
= gen_rtx_MOD (mode
, op0
, op1
);
2883 rtx adj
= round_sdiv_adjust (mode
, mod
, op1
);
2884 adj
= gen_rtx_NEG (mode
, gen_rtx_MULT (mode
, adj
, op1
));
2885 return gen_rtx_PLUS (mode
, mod
, adj
);
2889 return gen_rtx_ASHIFT (mode
, op0
, op1
);
2893 return gen_rtx_LSHIFTRT (mode
, op0
, op1
);
2895 return gen_rtx_ASHIFTRT (mode
, op0
, op1
);
2898 return gen_rtx_ROTATE (mode
, op0
, op1
);
2901 return gen_rtx_ROTATERT (mode
, op0
, op1
);
2905 return gen_rtx_UMIN (mode
, op0
, op1
);
2907 return gen_rtx_SMIN (mode
, op0
, op1
);
2911 return gen_rtx_UMAX (mode
, op0
, op1
);
2913 return gen_rtx_SMAX (mode
, op0
, op1
);
2916 case TRUTH_AND_EXPR
:
2917 return gen_rtx_AND (mode
, op0
, op1
);
2921 return gen_rtx_IOR (mode
, op0
, op1
);
2924 case TRUTH_XOR_EXPR
:
2925 return gen_rtx_XOR (mode
, op0
, op1
);
2927 case TRUTH_ANDIF_EXPR
:
2928 return gen_rtx_IF_THEN_ELSE (mode
, op0
, op1
, const0_rtx
);
2930 case TRUTH_ORIF_EXPR
:
2931 return gen_rtx_IF_THEN_ELSE (mode
, op0
, const_true_rtx
, op1
);
2933 case TRUTH_NOT_EXPR
:
2934 return gen_rtx_EQ (mode
, op0
, const0_rtx
);
2938 return gen_rtx_LTU (mode
, op0
, op1
);
2940 return gen_rtx_LT (mode
, op0
, op1
);
2944 return gen_rtx_LEU (mode
, op0
, op1
);
2946 return gen_rtx_LE (mode
, op0
, op1
);
2950 return gen_rtx_GTU (mode
, op0
, op1
);
2952 return gen_rtx_GT (mode
, op0
, op1
);
2956 return gen_rtx_GEU (mode
, op0
, op1
);
2958 return gen_rtx_GE (mode
, op0
, op1
);
2961 return gen_rtx_EQ (mode
, op0
, op1
);
2964 return gen_rtx_NE (mode
, op0
, op1
);
2966 case UNORDERED_EXPR
:
2967 return gen_rtx_UNORDERED (mode
, op0
, op1
);
2970 return gen_rtx_ORDERED (mode
, op0
, op1
);
2973 return gen_rtx_UNLT (mode
, op0
, op1
);
2976 return gen_rtx_UNLE (mode
, op0
, op1
);
2979 return gen_rtx_UNGT (mode
, op0
, op1
);
2982 return gen_rtx_UNGE (mode
, op0
, op1
);
2985 return gen_rtx_UNEQ (mode
, op0
, op1
);
2988 return gen_rtx_LTGT (mode
, op0
, op1
);
2991 return gen_rtx_IF_THEN_ELSE (mode
, op0
, op1
, op2
);
2994 gcc_assert (COMPLEX_MODE_P (mode
));
2995 if (GET_MODE (op0
) == VOIDmode
)
2996 op0
= gen_rtx_CONST (GET_MODE_INNER (mode
), op0
);
2997 if (GET_MODE (op1
) == VOIDmode
)
2998 op1
= gen_rtx_CONST (GET_MODE_INNER (mode
), op1
);
2999 return gen_rtx_CONCAT (mode
, op0
, op1
);
3002 if (GET_CODE (op0
) == CONCAT
)
3003 return gen_rtx_CONCAT (mode
, XEXP (op0
, 0),
3004 gen_rtx_NEG (GET_MODE_INNER (mode
),
3008 enum machine_mode imode
= GET_MODE_INNER (mode
);
3013 re
= adjust_address_nv (op0
, imode
, 0);
3014 im
= adjust_address_nv (op0
, imode
, GET_MODE_SIZE (imode
));
3018 enum machine_mode ifmode
= int_mode_for_mode (mode
);
3019 enum machine_mode ihmode
= int_mode_for_mode (imode
);
3021 if (ifmode
== BLKmode
|| ihmode
== BLKmode
)
3023 halfsize
= GEN_INT (GET_MODE_BITSIZE (ihmode
));
3026 re
= gen_rtx_SUBREG (ifmode
, re
, 0);
3027 re
= gen_rtx_ZERO_EXTRACT (ihmode
, re
, halfsize
, const0_rtx
);
3028 if (imode
!= ihmode
)
3029 re
= gen_rtx_SUBREG (imode
, re
, 0);
3030 im
= copy_rtx (op0
);
3032 im
= gen_rtx_SUBREG (ifmode
, im
, 0);
3033 im
= gen_rtx_ZERO_EXTRACT (ihmode
, im
, halfsize
, halfsize
);
3034 if (imode
!= ihmode
)
3035 im
= gen_rtx_SUBREG (imode
, im
, 0);
3037 im
= gen_rtx_NEG (imode
, im
);
3038 return gen_rtx_CONCAT (mode
, re
, im
);
3042 op0
= expand_debug_expr (TREE_OPERAND (exp
, 0));
3043 if (!op0
|| !MEM_P (op0
))
3045 if ((TREE_CODE (TREE_OPERAND (exp
, 0)) == VAR_DECL
3046 || TREE_CODE (TREE_OPERAND (exp
, 0)) == PARM_DECL
3047 || TREE_CODE (TREE_OPERAND (exp
, 0)) == RESULT_DECL
)
3048 && !TREE_ADDRESSABLE (TREE_OPERAND (exp
, 0)))
3049 return gen_rtx_DEBUG_IMPLICIT_PTR (mode
, TREE_OPERAND (exp
, 0));
3051 if (handled_component_p (TREE_OPERAND (exp
, 0)))
3053 HOST_WIDE_INT bitoffset
, bitsize
, maxsize
;
3055 = get_ref_base_and_extent (TREE_OPERAND (exp
, 0),
3056 &bitoffset
, &bitsize
, &maxsize
);
3057 if ((TREE_CODE (decl
) == VAR_DECL
3058 || TREE_CODE (decl
) == PARM_DECL
3059 || TREE_CODE (decl
) == RESULT_DECL
)
3060 && !TREE_ADDRESSABLE (decl
)
3061 && (bitoffset
% BITS_PER_UNIT
) == 0
3063 && bitsize
== maxsize
)
3064 return plus_constant (gen_rtx_DEBUG_IMPLICIT_PTR (mode
, decl
),
3065 bitoffset
/ BITS_PER_UNIT
);
3071 op0
= convert_debug_memory_address (mode
, XEXP (op0
, 0));
3076 exp
= build_constructor_from_list (TREE_TYPE (exp
),
3077 TREE_VECTOR_CST_ELTS (exp
));
3081 if (TREE_CODE (TREE_TYPE (exp
)) == VECTOR_TYPE
)
3086 op0
= gen_rtx_CONCATN
3087 (mode
, rtvec_alloc (TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp
))));
3089 FOR_EACH_CONSTRUCTOR_VALUE (CONSTRUCTOR_ELTS (exp
), i
, val
)
3091 op1
= expand_debug_expr (val
);
3094 XVECEXP (op0
, 0, i
) = op1
;
3097 if (i
< TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp
)))
3099 op1
= expand_debug_expr
3100 (build_zero_cst (TREE_TYPE (TREE_TYPE (exp
))));
3105 for (; i
< TYPE_VECTOR_SUBPARTS (TREE_TYPE (exp
)); i
++)
3106 XVECEXP (op0
, 0, i
) = op1
;
3112 goto flag_unsupported
;
3115 /* ??? Maybe handle some builtins? */
3120 gimple g
= get_gimple_for_ssa_name (exp
);
3123 op0
= expand_debug_expr (gimple_assign_rhs_to_tree (g
));
3129 int part
= var_to_partition (SA
.map
, exp
);
3131 if (part
== NO_PARTITION
)
3134 gcc_assert (part
>= 0 && (unsigned)part
< SA
.map
->num_partitions
);
3136 op0
= SA
.partition_to_pseudo
[part
];
3144 /* Vector stuff. For most of the codes we don't have rtl codes. */
3145 case REALIGN_LOAD_EXPR
:
3146 case REDUC_MAX_EXPR
:
3147 case REDUC_MIN_EXPR
:
3148 case REDUC_PLUS_EXPR
:
3150 case VEC_EXTRACT_EVEN_EXPR
:
3151 case VEC_EXTRACT_ODD_EXPR
:
3152 case VEC_INTERLEAVE_HIGH_EXPR
:
3153 case VEC_INTERLEAVE_LOW_EXPR
:
3154 case VEC_LSHIFT_EXPR
:
3155 case VEC_PACK_FIX_TRUNC_EXPR
:
3156 case VEC_PACK_SAT_EXPR
:
3157 case VEC_PACK_TRUNC_EXPR
:
3158 case VEC_RSHIFT_EXPR
:
3159 case VEC_UNPACK_FLOAT_HI_EXPR
:
3160 case VEC_UNPACK_FLOAT_LO_EXPR
:
3161 case VEC_UNPACK_HI_EXPR
:
3162 case VEC_UNPACK_LO_EXPR
:
3163 case VEC_WIDEN_MULT_HI_EXPR
:
3164 case VEC_WIDEN_MULT_LO_EXPR
:
3168 case ADDR_SPACE_CONVERT_EXPR
:
3169 case FIXED_CONVERT_EXPR
:
3171 case WITH_SIZE_EXPR
:
3175 if (SCALAR_INT_MODE_P (GET_MODE (op0
))
3176 && SCALAR_INT_MODE_P (mode
))
3178 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 0))))
3179 op0
= gen_rtx_ZERO_EXTEND (mode
, op0
);
3181 op0
= gen_rtx_SIGN_EXTEND (mode
, op0
);
3182 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 1))))
3183 op1
= gen_rtx_ZERO_EXTEND (mode
, op1
);
3185 op1
= gen_rtx_SIGN_EXTEND (mode
, op1
);
3186 op0
= gen_rtx_MULT (mode
, op0
, op1
);
3187 return gen_rtx_PLUS (mode
, op0
, op2
);
3191 case WIDEN_MULT_EXPR
:
3192 case WIDEN_MULT_PLUS_EXPR
:
3193 case WIDEN_MULT_MINUS_EXPR
:
3194 if (SCALAR_INT_MODE_P (GET_MODE (op0
))
3195 && SCALAR_INT_MODE_P (mode
))
3197 enum machine_mode inner_mode
= GET_MODE (op0
);
3198 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 0))))
3199 op0
= simplify_gen_unary (ZERO_EXTEND
, mode
, op0
, inner_mode
);
3201 op0
= simplify_gen_unary (SIGN_EXTEND
, mode
, op0
, inner_mode
);
3202 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 1))))
3203 op1
= simplify_gen_unary (ZERO_EXTEND
, mode
, op1
, inner_mode
);
3205 op1
= simplify_gen_unary (SIGN_EXTEND
, mode
, op1
, inner_mode
);
3206 op0
= gen_rtx_MULT (mode
, op0
, op1
);
3207 if (TREE_CODE (exp
) == WIDEN_MULT_EXPR
)
3209 else if (TREE_CODE (exp
) == WIDEN_MULT_PLUS_EXPR
)
3210 return gen_rtx_PLUS (mode
, op0
, op2
);
3212 return gen_rtx_MINUS (mode
, op2
, op0
);
3216 case WIDEN_SUM_EXPR
:
3217 if (SCALAR_INT_MODE_P (GET_MODE (op0
))
3218 && SCALAR_INT_MODE_P (mode
))
3220 if (TYPE_UNSIGNED (TREE_TYPE (TREE_OPERAND (exp
, 0))))
3221 op0
= gen_rtx_ZERO_EXTEND (mode
, op0
);
3223 op0
= gen_rtx_SIGN_EXTEND (mode
, op0
);
3224 return gen_rtx_PLUS (mode
, op0
, op1
);
3229 return gen_rtx_FMA (mode
, op0
, op1
, op2
);
3233 #ifdef ENABLE_CHECKING
3242 /* Expand the _LOCs in debug insns. We run this after expanding all
3243 regular insns, so that any variables referenced in the function
3244 will have their DECL_RTLs set. */
3247 expand_debug_locations (void)
3250 rtx last
= get_last_insn ();
3251 int save_strict_alias
= flag_strict_aliasing
;
3253 /* New alias sets while setting up memory attributes cause
3254 -fcompare-debug failures, even though it doesn't bring about any
3256 flag_strict_aliasing
= 0;
3258 for (insn
= get_insns (); insn
; insn
= NEXT_INSN (insn
))
3259 if (DEBUG_INSN_P (insn
))
3261 tree value
= (tree
)INSN_VAR_LOCATION_LOC (insn
);
3263 enum machine_mode mode
;
3265 if (value
== NULL_TREE
)
3269 val
= expand_debug_expr (value
);
3270 gcc_assert (last
== get_last_insn ());
3274 val
= gen_rtx_UNKNOWN_VAR_LOC ();
3277 mode
= GET_MODE (INSN_VAR_LOCATION (insn
));
3279 gcc_assert (mode
== GET_MODE (val
)
3280 || (GET_MODE (val
) == VOIDmode
3281 && (CONST_INT_P (val
)
3282 || GET_CODE (val
) == CONST_FIXED
3283 || GET_CODE (val
) == CONST_DOUBLE
3284 || GET_CODE (val
) == LABEL_REF
)));
3287 INSN_VAR_LOCATION_LOC (insn
) = val
;
3290 flag_strict_aliasing
= save_strict_alias
;
3293 /* Expand basic block BB from GIMPLE trees to RTL. */
3296 expand_gimple_basic_block (basic_block bb
)
3298 gimple_stmt_iterator gsi
;
3307 fprintf (dump_file
, "\n;; Generating RTL for gimple basic block %d\n",
3310 /* Note that since we are now transitioning from GIMPLE to RTL, we
3311 cannot use the gsi_*_bb() routines because they expect the basic
3312 block to be in GIMPLE, instead of RTL. Therefore, we need to
3313 access the BB sequence directly. */
3314 stmts
= bb_seq (bb
);
3315 bb
->il
.gimple
= NULL
;
3316 rtl_profile_for_bb (bb
);
3317 init_rtl_bb_info (bb
);
3318 bb
->flags
|= BB_RTL
;
3320 /* Remove the RETURN_EXPR if we may fall though to the exit
3322 gsi
= gsi_last (stmts
);
3323 if (!gsi_end_p (gsi
)
3324 && gimple_code (gsi_stmt (gsi
)) == GIMPLE_RETURN
)
3326 gimple ret_stmt
= gsi_stmt (gsi
);
3328 gcc_assert (single_succ_p (bb
));
3329 gcc_assert (single_succ (bb
) == EXIT_BLOCK_PTR
);
3331 if (bb
->next_bb
== EXIT_BLOCK_PTR
3332 && !gimple_return_retval (ret_stmt
))
3334 gsi_remove (&gsi
, false);
3335 single_succ_edge (bb
)->flags
|= EDGE_FALLTHRU
;
3339 gsi
= gsi_start (stmts
);
3340 if (!gsi_end_p (gsi
))
3342 stmt
= gsi_stmt (gsi
);
3343 if (gimple_code (stmt
) != GIMPLE_LABEL
)
3347 elt
= pointer_map_contains (lab_rtx_for_bb
, bb
);
3351 last
= get_last_insn ();
3355 expand_gimple_stmt (stmt
);
3360 emit_label ((rtx
) *elt
);
3362 /* Java emits line number notes in the top of labels.
3363 ??? Make this go away once line number notes are obsoleted. */
3364 BB_HEAD (bb
) = NEXT_INSN (last
);
3365 if (NOTE_P (BB_HEAD (bb
)))
3366 BB_HEAD (bb
) = NEXT_INSN (BB_HEAD (bb
));
3367 note
= emit_note_after (NOTE_INSN_BASIC_BLOCK
, BB_HEAD (bb
));
3369 maybe_dump_rtl_for_gimple_stmt (stmt
, last
);
3372 note
= BB_HEAD (bb
) = emit_note (NOTE_INSN_BASIC_BLOCK
);
3374 NOTE_BASIC_BLOCK (note
) = bb
;
3376 for (; !gsi_end_p (gsi
); gsi_next (&gsi
))
3380 stmt
= gsi_stmt (gsi
);
3382 /* If this statement is a non-debug one, and we generate debug
3383 insns, then this one might be the last real use of a TERed
3384 SSA_NAME, but where there are still some debug uses further
3385 down. Expanding the current SSA name in such further debug
3386 uses by their RHS might lead to wrong debug info, as coalescing
3387 might make the operands of such RHS be placed into the same
3388 pseudo as something else. Like so:
3389 a_1 = a_0 + 1; // Assume a_1 is TERed and a_0 is dead
3393 As a_0 and a_2 don't overlap in lifetime, assume they are coalesced.
3394 If we now would expand a_1 by it's RHS (a_0 + 1) in the debug use,
3395 the write to a_2 would actually have clobbered the place which
3398 So, instead of that, we recognize the situation, and generate
3399 debug temporaries at the last real use of TERed SSA names:
3406 if (MAY_HAVE_DEBUG_INSNS
3408 && !is_gimple_debug (stmt
))
3414 location_t sloc
= get_curr_insn_source_location ();
3415 tree sblock
= get_curr_insn_block ();
3417 /* Look for SSA names that have their last use here (TERed
3418 names always have only one real use). */
3419 FOR_EACH_SSA_TREE_OPERAND (op
, stmt
, iter
, SSA_OP_USE
)
3420 if ((def
= get_gimple_for_ssa_name (op
)))
3422 imm_use_iterator imm_iter
;
3423 use_operand_p use_p
;
3424 bool have_debug_uses
= false;
3426 FOR_EACH_IMM_USE_FAST (use_p
, imm_iter
, op
)
3428 if (gimple_debug_bind_p (USE_STMT (use_p
)))
3430 have_debug_uses
= true;
3435 if (have_debug_uses
)
3437 /* OP is a TERed SSA name, with DEF it's defining
3438 statement, and where OP is used in further debug
3439 instructions. Generate a debug temporary, and
3440 replace all uses of OP in debug insns with that
3443 tree value
= gimple_assign_rhs_to_tree (def
);
3444 tree vexpr
= make_node (DEBUG_EXPR_DECL
);
3446 enum machine_mode mode
;
3448 set_curr_insn_source_location (gimple_location (def
));
3449 set_curr_insn_block (gimple_block (def
));
3451 DECL_ARTIFICIAL (vexpr
) = 1;
3452 TREE_TYPE (vexpr
) = TREE_TYPE (value
);
3454 mode
= DECL_MODE (value
);
3456 mode
= TYPE_MODE (TREE_TYPE (value
));
3457 DECL_MODE (vexpr
) = mode
;
3459 val
= gen_rtx_VAR_LOCATION
3460 (mode
, vexpr
, (rtx
)value
, VAR_INIT_STATUS_INITIALIZED
);
3462 val
= emit_debug_insn (val
);
3464 FOR_EACH_IMM_USE_STMT (debugstmt
, imm_iter
, op
)
3466 if (!gimple_debug_bind_p (debugstmt
))
3469 FOR_EACH_IMM_USE_ON_STMT (use_p
, imm_iter
)
3470 SET_USE (use_p
, vexpr
);
3472 update_stmt (debugstmt
);
3476 set_curr_insn_source_location (sloc
);
3477 set_curr_insn_block (sblock
);
3480 currently_expanding_gimple_stmt
= stmt
;
3482 /* Expand this statement, then evaluate the resulting RTL and
3483 fixup the CFG accordingly. */
3484 if (gimple_code (stmt
) == GIMPLE_COND
)
3486 new_bb
= expand_gimple_cond (bb
, stmt
);
3490 else if (gimple_debug_bind_p (stmt
))
3492 location_t sloc
= get_curr_insn_source_location ();
3493 tree sblock
= get_curr_insn_block ();
3494 gimple_stmt_iterator nsi
= gsi
;
3498 tree var
= gimple_debug_bind_get_var (stmt
);
3501 enum machine_mode mode
;
3503 if (gimple_debug_bind_has_value_p (stmt
))
3504 value
= gimple_debug_bind_get_value (stmt
);
3508 last
= get_last_insn ();
3510 set_curr_insn_source_location (gimple_location (stmt
));
3511 set_curr_insn_block (gimple_block (stmt
));
3514 mode
= DECL_MODE (var
);
3516 mode
= TYPE_MODE (TREE_TYPE (var
));
3518 val
= gen_rtx_VAR_LOCATION
3519 (mode
, var
, (rtx
)value
, VAR_INIT_STATUS_INITIALIZED
);
3521 val
= emit_debug_insn (val
);
3523 if (dump_file
&& (dump_flags
& TDF_DETAILS
))
3525 /* We can't dump the insn with a TREE where an RTX
3527 INSN_VAR_LOCATION_LOC (val
) = const0_rtx
;
3528 maybe_dump_rtl_for_gimple_stmt (stmt
, last
);
3529 INSN_VAR_LOCATION_LOC (val
) = (rtx
)value
;
3532 /* In order not to generate too many debug temporaries,
3533 we delink all uses of debug statements we already expanded.
3534 Therefore debug statements between definition and real
3535 use of TERed SSA names will continue to use the SSA name,
3536 and not be replaced with debug temps. */
3537 delink_stmt_imm_use (stmt
);
3541 if (gsi_end_p (nsi
))
3543 stmt
= gsi_stmt (nsi
);
3544 if (!gimple_debug_bind_p (stmt
))
3548 set_curr_insn_source_location (sloc
);
3549 set_curr_insn_block (sblock
);
3553 if (is_gimple_call (stmt
) && gimple_call_tail_p (stmt
))
3556 new_bb
= expand_gimple_tailcall (bb
, stmt
, &can_fallthru
);
3567 def_operand_p def_p
;
3568 def_p
= SINGLE_SSA_DEF_OPERAND (stmt
, SSA_OP_DEF
);
3572 /* Ignore this stmt if it is in the list of
3573 replaceable expressions. */
3575 && bitmap_bit_p (SA
.values
,
3576 SSA_NAME_VERSION (DEF_FROM_PTR (def_p
))))
3579 last
= expand_gimple_stmt (stmt
);
3580 maybe_dump_rtl_for_gimple_stmt (stmt
, last
);
3585 currently_expanding_gimple_stmt
= NULL
;
3587 /* Expand implicit goto and convert goto_locus. */
3588 FOR_EACH_EDGE (e
, ei
, bb
->succs
)
3590 if (e
->goto_locus
&& e
->goto_block
)
3592 set_curr_insn_source_location (e
->goto_locus
);
3593 set_curr_insn_block (e
->goto_block
);
3594 e
->goto_locus
= curr_insn_locator ();
3596 e
->goto_block
= NULL
;
3597 if ((e
->flags
& EDGE_FALLTHRU
) && e
->dest
!= bb
->next_bb
)
3599 emit_jump (label_rtx_for_bb (e
->dest
));
3600 e
->flags
&= ~EDGE_FALLTHRU
;
3604 /* Expanded RTL can create a jump in the last instruction of block.
3605 This later might be assumed to be a jump to successor and break edge insertion.
3606 We need to insert dummy move to prevent this. PR41440. */
3607 if (single_succ_p (bb
)
3608 && (single_succ_edge (bb
)->flags
& EDGE_FALLTHRU
)
3609 && (last
= get_last_insn ())
3612 rtx dummy
= gen_reg_rtx (SImode
);
3613 emit_insn_after_noloc (gen_move_insn (dummy
, dummy
), last
, NULL
);
3616 do_pending_stack_adjust ();
3618 /* Find the block tail. The last insn in the block is the insn
3619 before a barrier and/or table jump insn. */
3620 last
= get_last_insn ();
3621 if (BARRIER_P (last
))
3622 last
= PREV_INSN (last
);
3623 if (JUMP_TABLE_DATA_P (last
))
3624 last
= PREV_INSN (PREV_INSN (last
));
3627 update_bb_for_insn (bb
);
3633 /* Create a basic block for initialization code. */
3636 construct_init_block (void)
3638 basic_block init_block
, first_block
;
3642 /* Multiple entry points not supported yet. */
3643 gcc_assert (EDGE_COUNT (ENTRY_BLOCK_PTR
->succs
) == 1);
3644 init_rtl_bb_info (ENTRY_BLOCK_PTR
);
3645 init_rtl_bb_info (EXIT_BLOCK_PTR
);
3646 ENTRY_BLOCK_PTR
->flags
|= BB_RTL
;
3647 EXIT_BLOCK_PTR
->flags
|= BB_RTL
;
3649 e
= EDGE_SUCC (ENTRY_BLOCK_PTR
, 0);
3651 /* When entry edge points to first basic block, we don't need jump,
3652 otherwise we have to jump into proper target. */
3653 if (e
&& e
->dest
!= ENTRY_BLOCK_PTR
->next_bb
)
3655 tree label
= gimple_block_label (e
->dest
);
3657 emit_jump (label_rtx (label
));
3661 flags
= EDGE_FALLTHRU
;
3663 init_block
= create_basic_block (NEXT_INSN (get_insns ()),
3666 init_block
->frequency
= ENTRY_BLOCK_PTR
->frequency
;
3667 init_block
->count
= ENTRY_BLOCK_PTR
->count
;
3670 first_block
= e
->dest
;
3671 redirect_edge_succ (e
, init_block
);
3672 e
= make_edge (init_block
, first_block
, flags
);
3675 e
= make_edge (init_block
, EXIT_BLOCK_PTR
, EDGE_FALLTHRU
);
3676 e
->probability
= REG_BR_PROB_BASE
;
3677 e
->count
= ENTRY_BLOCK_PTR
->count
;
3679 update_bb_for_insn (init_block
);
3683 /* For each lexical block, set BLOCK_NUMBER to the depth at which it is
3684 found in the block tree. */
3687 set_block_levels (tree block
, int level
)
3691 BLOCK_NUMBER (block
) = level
;
3692 set_block_levels (BLOCK_SUBBLOCKS (block
), level
+ 1);
3693 block
= BLOCK_CHAIN (block
);
3697 /* Create a block containing landing pads and similar stuff. */
3700 construct_exit_block (void)
3702 rtx head
= get_last_insn ();
3704 basic_block exit_block
;
3708 rtx orig_end
= BB_END (EXIT_BLOCK_PTR
->prev_bb
);
3710 rtl_profile_for_bb (EXIT_BLOCK_PTR
);
3712 /* Make sure the locus is set to the end of the function, so that
3713 epilogue line numbers and warnings are set properly. */
3714 if (cfun
->function_end_locus
!= UNKNOWN_LOCATION
)
3715 input_location
= cfun
->function_end_locus
;
3717 /* The following insns belong to the top scope. */
3718 set_curr_insn_block (DECL_INITIAL (current_function_decl
));
3720 /* Generate rtl for function exit. */
3721 expand_function_end ();
3723 end
= get_last_insn ();
3726 /* While emitting the function end we could move end of the last basic block.
3728 BB_END (EXIT_BLOCK_PTR
->prev_bb
) = orig_end
;
3729 while (NEXT_INSN (head
) && NOTE_P (NEXT_INSN (head
)))
3730 head
= NEXT_INSN (head
);
3731 exit_block
= create_basic_block (NEXT_INSN (head
), end
,
3732 EXIT_BLOCK_PTR
->prev_bb
);
3733 exit_block
->frequency
= EXIT_BLOCK_PTR
->frequency
;
3734 exit_block
->count
= EXIT_BLOCK_PTR
->count
;
3737 while (ix
< EDGE_COUNT (EXIT_BLOCK_PTR
->preds
))
3739 e
= EDGE_PRED (EXIT_BLOCK_PTR
, ix
);
3740 if (!(e
->flags
& EDGE_ABNORMAL
))
3741 redirect_edge_succ (e
, exit_block
);
3746 e
= make_edge (exit_block
, EXIT_BLOCK_PTR
, EDGE_FALLTHRU
);
3747 e
->probability
= REG_BR_PROB_BASE
;
3748 e
->count
= EXIT_BLOCK_PTR
->count
;
3749 FOR_EACH_EDGE (e2
, ei
, EXIT_BLOCK_PTR
->preds
)
3752 e
->count
-= e2
->count
;
3753 exit_block
->count
-= e2
->count
;
3754 exit_block
->frequency
-= EDGE_FREQUENCY (e2
);
3758 if (exit_block
->count
< 0)
3759 exit_block
->count
= 0;
3760 if (exit_block
->frequency
< 0)
3761 exit_block
->frequency
= 0;
3762 update_bb_for_insn (exit_block
);
3765 /* Helper function for discover_nonconstant_array_refs.
3766 Look for ARRAY_REF nodes with non-constant indexes and mark them
3770 discover_nonconstant_array_refs_r (tree
* tp
, int *walk_subtrees
,
3771 void *data ATTRIBUTE_UNUSED
)
3775 if (IS_TYPE_OR_DECL_P (t
))
3777 else if (TREE_CODE (t
) == ARRAY_REF
|| TREE_CODE (t
) == ARRAY_RANGE_REF
)
3779 while (((TREE_CODE (t
) == ARRAY_REF
|| TREE_CODE (t
) == ARRAY_RANGE_REF
)
3780 && is_gimple_min_invariant (TREE_OPERAND (t
, 1))
3781 && (!TREE_OPERAND (t
, 2)
3782 || is_gimple_min_invariant (TREE_OPERAND (t
, 2))))
3783 || (TREE_CODE (t
) == COMPONENT_REF
3784 && (!TREE_OPERAND (t
,2)
3785 || is_gimple_min_invariant (TREE_OPERAND (t
, 2))))
3786 || TREE_CODE (t
) == BIT_FIELD_REF
3787 || TREE_CODE (t
) == REALPART_EXPR
3788 || TREE_CODE (t
) == IMAGPART_EXPR
3789 || TREE_CODE (t
) == VIEW_CONVERT_EXPR
3790 || CONVERT_EXPR_P (t
))
3791 t
= TREE_OPERAND (t
, 0);
3793 if (TREE_CODE (t
) == ARRAY_REF
|| TREE_CODE (t
) == ARRAY_RANGE_REF
)
3795 t
= get_base_address (t
);
3797 && DECL_MODE (t
) != BLKmode
)
3798 TREE_ADDRESSABLE (t
) = 1;
3807 /* RTL expansion is not able to compile array references with variable
3808 offsets for arrays stored in single register. Discover such
3809 expressions and mark variables as addressable to avoid this
3813 discover_nonconstant_array_refs (void)
3816 gimple_stmt_iterator gsi
;
3819 for (gsi
= gsi_start_bb (bb
); !gsi_end_p (gsi
); gsi_next (&gsi
))
3821 gimple stmt
= gsi_stmt (gsi
);
3822 if (!is_gimple_debug (stmt
))
3823 walk_gimple_op (stmt
, discover_nonconstant_array_refs_r
, NULL
);
3827 /* This function sets crtl->args.internal_arg_pointer to a virtual
3828 register if DRAP is needed. Local register allocator will replace
3829 virtual_incoming_args_rtx with the virtual register. */
3832 expand_stack_alignment (void)
3835 unsigned int preferred_stack_boundary
;
3837 if (! SUPPORTS_STACK_ALIGNMENT
)
3840 if (cfun
->calls_alloca
3841 || cfun
->has_nonlocal_label
3842 || crtl
->has_nonlocal_goto
)
3843 crtl
->need_drap
= true;
3845 /* Call update_stack_boundary here again to update incoming stack
3846 boundary. It may set incoming stack alignment to a different
3847 value after RTL expansion. TARGET_FUNCTION_OK_FOR_SIBCALL may
3848 use the minimum incoming stack alignment to check if it is OK
3849 to perform sibcall optimization since sibcall optimization will
3850 only align the outgoing stack to incoming stack boundary. */
3851 if (targetm
.calls
.update_stack_boundary
)
3852 targetm
.calls
.update_stack_boundary ();
3854 /* The incoming stack frame has to be aligned at least at
3855 parm_stack_boundary. */
3856 gcc_assert (crtl
->parm_stack_boundary
<= INCOMING_STACK_BOUNDARY
);
3858 /* Update crtl->stack_alignment_estimated and use it later to align
3859 stack. We check PREFERRED_STACK_BOUNDARY if there may be non-call
3860 exceptions since callgraph doesn't collect incoming stack alignment
3862 if (cfun
->can_throw_non_call_exceptions
3863 && PREFERRED_STACK_BOUNDARY
> crtl
->preferred_stack_boundary
)
3864 preferred_stack_boundary
= PREFERRED_STACK_BOUNDARY
;
3866 preferred_stack_boundary
= crtl
->preferred_stack_boundary
;
3867 if (preferred_stack_boundary
> crtl
->stack_alignment_estimated
)
3868 crtl
->stack_alignment_estimated
= preferred_stack_boundary
;
3869 if (preferred_stack_boundary
> crtl
->stack_alignment_needed
)
3870 crtl
->stack_alignment_needed
= preferred_stack_boundary
;
3872 gcc_assert (crtl
->stack_alignment_needed
3873 <= crtl
->stack_alignment_estimated
);
3875 crtl
->stack_realign_needed
3876 = INCOMING_STACK_BOUNDARY
< crtl
->stack_alignment_estimated
;
3877 crtl
->stack_realign_tried
= crtl
->stack_realign_needed
;
3879 crtl
->stack_realign_processed
= true;
3881 /* Target has to redefine TARGET_GET_DRAP_RTX to support stack
3883 gcc_assert (targetm
.calls
.get_drap_rtx
!= NULL
);
3884 drap_rtx
= targetm
.calls
.get_drap_rtx ();
3886 /* stack_realign_drap and drap_rtx must match. */
3887 gcc_assert ((stack_realign_drap
!= 0) == (drap_rtx
!= NULL
));
3889 /* Do nothing if NULL is returned, which means DRAP is not needed. */
3890 if (NULL
!= drap_rtx
)
3892 crtl
->args
.internal_arg_pointer
= drap_rtx
;
3894 /* Call fixup_tail_calls to clean up REG_EQUIV note if DRAP is
3896 fixup_tail_calls ();
3900 /* Translate the intermediate representation contained in the CFG
3901 from GIMPLE trees to RTL.
3903 We do conversion per basic block and preserve/update the tree CFG.
3904 This implies we have to do some magic as the CFG can simultaneously
3905 consist of basic blocks containing RTL and GIMPLE trees. This can
3906 confuse the CFG hooks, so be careful to not manipulate CFG during
3910 gimple_expand_cfg (void)
3912 basic_block bb
, init_block
;
3919 timevar_push (TV_OUT_OF_SSA
);
3920 rewrite_out_of_ssa (&SA
);
3921 timevar_pop (TV_OUT_OF_SSA
);
3922 SA
.partition_to_pseudo
= (rtx
*)xcalloc (SA
.map
->num_partitions
,
3925 /* Some backends want to know that we are expanding to RTL. */
3926 currently_expanding_to_rtl
= 1;
3928 rtl_profile_for_bb (ENTRY_BLOCK_PTR
);
3930 insn_locators_alloc ();
3931 if (!DECL_IS_BUILTIN (current_function_decl
))
3933 /* Eventually, all FEs should explicitly set function_start_locus. */
3934 if (cfun
->function_start_locus
== UNKNOWN_LOCATION
)
3935 set_curr_insn_source_location
3936 (DECL_SOURCE_LOCATION (current_function_decl
));
3938 set_curr_insn_source_location (cfun
->function_start_locus
);
3941 set_curr_insn_source_location (UNKNOWN_LOCATION
);
3942 set_curr_insn_block (DECL_INITIAL (current_function_decl
));
3943 prologue_locator
= curr_insn_locator ();
3945 #ifdef INSN_SCHEDULING
3946 init_sched_attrs ();
3949 /* Make sure first insn is a note even if we don't want linenums.
3950 This makes sure the first insn will never be deleted.
3951 Also, final expects a note to appear there. */
3952 emit_note (NOTE_INSN_DELETED
);
3954 /* Mark arrays indexed with non-constant indices with TREE_ADDRESSABLE. */
3955 discover_nonconstant_array_refs ();
3957 targetm
.expand_to_rtl_hook ();
3958 crtl
->stack_alignment_needed
= STACK_BOUNDARY
;
3959 crtl
->max_used_stack_slot_alignment
= STACK_BOUNDARY
;
3960 crtl
->stack_alignment_estimated
= 0;
3961 crtl
->preferred_stack_boundary
= STACK_BOUNDARY
;
3962 cfun
->cfg
->max_jumptable_ents
= 0;
3964 /* Resovle the function section. Some targets, like ARM EABI rely on knowledge
3965 of the function section at exapnsion time to predict distance of calls. */
3966 resolve_unique_section (current_function_decl
, 0, flag_function_sections
);
3968 /* Expand the variables recorded during gimple lowering. */
3969 timevar_push (TV_VAR_EXPAND
);
3972 expand_used_vars ();
3974 var_seq
= get_insns ();
3976 timevar_pop (TV_VAR_EXPAND
);
3978 /* Honor stack protection warnings. */
3979 if (warn_stack_protect
)
3981 if (cfun
->calls_alloca
)
3982 warning (OPT_Wstack_protector
,
3983 "stack protector not protecting local variables: "
3984 "variable length buffer");
3985 if (has_short_buffer
&& !crtl
->stack_protect_guard
)
3986 warning (OPT_Wstack_protector
,
3987 "stack protector not protecting function: "
3988 "all local arrays are less than %d bytes long",
3989 (int) PARAM_VALUE (PARAM_SSP_BUFFER_SIZE
));
3992 /* Set up parameters and prepare for return, for the function. */
3993 expand_function_start (current_function_decl
);
3995 /* If we emitted any instructions for setting up the variables,
3996 emit them before the FUNCTION_START note. */
3999 emit_insn_before (var_seq
, parm_birth_insn
);
4001 /* In expand_function_end we'll insert the alloca save/restore
4002 before parm_birth_insn. We've just insertted an alloca call.
4003 Adjust the pointer to match. */
4004 parm_birth_insn
= var_seq
;
4007 /* Now that we also have the parameter RTXs, copy them over to our
4009 for (i
= 0; i
< SA
.map
->num_partitions
; i
++)
4011 tree var
= SSA_NAME_VAR (partition_to_var (SA
.map
, i
));
4013 if (TREE_CODE (var
) != VAR_DECL
4014 && !SA
.partition_to_pseudo
[i
])
4015 SA
.partition_to_pseudo
[i
] = DECL_RTL_IF_SET (var
);
4016 gcc_assert (SA
.partition_to_pseudo
[i
]);
4018 /* If this decl was marked as living in multiple places, reset
4019 this now to NULL. */
4020 if (DECL_RTL_IF_SET (var
) == pc_rtx
)
4021 SET_DECL_RTL (var
, NULL
);
4023 /* Some RTL parts really want to look at DECL_RTL(x) when x
4024 was a decl marked in REG_ATTR or MEM_ATTR. We could use
4025 SET_DECL_RTL here making this available, but that would mean
4026 to select one of the potentially many RTLs for one DECL. Instead
4027 of doing that we simply reset the MEM_EXPR of the RTL in question,
4028 then nobody can get at it and hence nobody can call DECL_RTL on it. */
4029 if (!DECL_RTL_SET_P (var
))
4031 if (MEM_P (SA
.partition_to_pseudo
[i
]))
4032 set_mem_expr (SA
.partition_to_pseudo
[i
], NULL
);
4036 /* If this function is `main', emit a call to `__main'
4037 to run global initializers, etc. */
4038 if (DECL_NAME (current_function_decl
)
4039 && MAIN_NAME_P (DECL_NAME (current_function_decl
))
4040 && DECL_FILE_SCOPE_P (current_function_decl
))
4041 expand_main_function ();
4043 /* Initialize the stack_protect_guard field. This must happen after the
4044 call to __main (if any) so that the external decl is initialized. */
4045 if (crtl
->stack_protect_guard
)
4046 stack_protect_prologue ();
4048 expand_phi_nodes (&SA
);
4050 /* Register rtl specific functions for cfg. */
4051 rtl_register_cfg_hooks ();
4053 init_block
= construct_init_block ();
4055 /* Clear EDGE_EXECUTABLE on the entry edge(s). It is cleaned from the
4056 remaining edges later. */
4057 FOR_EACH_EDGE (e
, ei
, ENTRY_BLOCK_PTR
->succs
)
4058 e
->flags
&= ~EDGE_EXECUTABLE
;
4060 lab_rtx_for_bb
= pointer_map_create ();
4061 FOR_BB_BETWEEN (bb
, init_block
->next_bb
, EXIT_BLOCK_PTR
, next_bb
)
4062 bb
= expand_gimple_basic_block (bb
);
4064 if (MAY_HAVE_DEBUG_INSNS
)
4065 expand_debug_locations ();
4067 execute_free_datastructures ();
4068 timevar_push (TV_OUT_OF_SSA
);
4069 finish_out_of_ssa (&SA
);
4070 timevar_pop (TV_OUT_OF_SSA
);
4072 timevar_push (TV_POST_EXPAND
);
4073 /* We are no longer in SSA form. */
4074 cfun
->gimple_df
->in_ssa_p
= false;
4076 /* Expansion is used by optimization passes too, set maybe_hot_insn_p
4077 conservatively to true until they are all profile aware. */
4078 pointer_map_destroy (lab_rtx_for_bb
);
4081 construct_exit_block ();
4082 set_curr_insn_block (DECL_INITIAL (current_function_decl
));
4083 insn_locators_finalize ();
4085 /* Zap the tree EH table. */
4086 set_eh_throw_stmt_table (cfun
, NULL
);
4088 rebuild_jump_labels (get_insns ());
4090 FOR_BB_BETWEEN (bb
, ENTRY_BLOCK_PTR
, EXIT_BLOCK_PTR
, next_bb
)
4094 for (ei
= ei_start (bb
->succs
); (e
= ei_safe_edge (ei
)); )
4098 /* Avoid putting insns before parm_birth_insn. */
4099 if (e
->src
== ENTRY_BLOCK_PTR
4100 && single_succ_p (ENTRY_BLOCK_PTR
)
4103 rtx insns
= e
->insns
.r
;
4104 e
->insns
.r
= NULL_RTX
;
4105 emit_insn_after_noloc (insns
, parm_birth_insn
, e
->dest
);
4108 commit_one_edge_insertion (e
);
4115 /* We're done expanding trees to RTL. */
4116 currently_expanding_to_rtl
= 0;
4118 FOR_BB_BETWEEN (bb
, ENTRY_BLOCK_PTR
->next_bb
, EXIT_BLOCK_PTR
, next_bb
)
4122 for (ei
= ei_start (bb
->succs
); (e
= ei_safe_edge (ei
)); )
4124 /* Clear EDGE_EXECUTABLE. This flag is never used in the backend. */
4125 e
->flags
&= ~EDGE_EXECUTABLE
;
4127 /* At the moment not all abnormal edges match the RTL
4128 representation. It is safe to remove them here as
4129 find_many_sub_basic_blocks will rediscover them.
4130 In the future we should get this fixed properly. */
4131 if ((e
->flags
& EDGE_ABNORMAL
)
4132 && !(e
->flags
& EDGE_SIBCALL
))
4139 blocks
= sbitmap_alloc (last_basic_block
);
4140 sbitmap_ones (blocks
);
4141 find_many_sub_basic_blocks (blocks
);
4142 sbitmap_free (blocks
);
4143 purge_all_dead_edges ();
4147 expand_stack_alignment ();
4149 #ifdef ENABLE_CHECKING
4150 verify_flow_info ();
4153 /* There's no need to defer outputting this function any more; we
4154 know we want to output it. */
4155 DECL_DEFER_OUTPUT (current_function_decl
) = 0;
4157 /* Now that we're done expanding trees to RTL, we shouldn't have any
4158 more CONCATs anywhere. */
4159 generating_concat_p
= 0;
4164 "\n\n;;\n;; Full RTL generated for this function:\n;;\n");
4165 /* And the pass manager will dump RTL for us. */
4168 /* If we're emitting a nested function, make sure its parent gets
4169 emitted as well. Doing otherwise confuses debug info. */
4172 for (parent
= DECL_CONTEXT (current_function_decl
);
4173 parent
!= NULL_TREE
;
4174 parent
= get_containing_scope (parent
))
4175 if (TREE_CODE (parent
) == FUNCTION_DECL
)
4176 TREE_SYMBOL_REFERENCED (DECL_ASSEMBLER_NAME (parent
)) = 1;
4179 /* We are now committed to emitting code for this function. Do any
4180 preparation, such as emitting abstract debug info for the inline
4181 before it gets mangled by optimization. */
4182 if (cgraph_function_possibly_inlined_p (current_function_decl
))
4183 (*debug_hooks
->outlining_inline_function
) (current_function_decl
);
4185 TREE_ASM_WRITTEN (current_function_decl
) = 1;
4187 /* After expanding, the return labels are no longer needed. */
4188 return_label
= NULL
;
4189 naked_return_label
= NULL
;
4190 /* Tag the blocks with a depth number so that change_scope can find
4191 the common parent easily. */
4192 set_block_levels (DECL_INITIAL (cfun
->decl
), 0);
4193 default_rtl_profile ();
4194 timevar_pop (TV_POST_EXPAND
);
4198 struct rtl_opt_pass pass_expand
=
4202 "expand", /* name */
4204 gimple_expand_cfg
, /* execute */
4207 0, /* static_pass_number */
4208 TV_EXPAND
, /* tv_id */
4209 PROP_ssa
| PROP_gimple_leh
| PROP_cfg
4210 | PROP_gimple_lcx
, /* properties_required */
4211 PROP_rtl
, /* properties_provided */
4212 PROP_ssa
| PROP_trees
, /* properties_destroyed */
4213 TODO_verify_ssa
| TODO_verify_flow
4214 | TODO_verify_stmts
, /* todo_flags_start */
4216 | TODO_ggc_collect
/* todo_flags_finish */