[AArch64] Use new target pass registration framework for FMA steering pass
[official-gcc.git] / gcc / dce.c
blob154469c2f0a263b639bc8f5a14457b2fd35769a6
1 /* RTL dead code elimination.
2 Copyright (C) 2005-2016 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "backend.h"
24 #include "rtl.h"
25 #include "tree.h"
26 #include "predict.h"
27 #include "df.h"
28 #include "memmodel.h"
29 #include "tm_p.h"
30 #include "emit-rtl.h" /* FIXME: Can go away once crtl is moved to rtl.h. */
31 #include "cfgrtl.h"
32 #include "cfgbuild.h"
33 #include "cfgcleanup.h"
34 #include "dce.h"
35 #include "valtrack.h"
36 #include "tree-pass.h"
37 #include "dbgcnt.h"
40 /* -------------------------------------------------------------------------
41 Core mark/delete routines
42 ------------------------------------------------------------------------- */
44 /* True while DCE is being run from inside the df engine (it is set
   around the call in run_fast_df_dce); in this case, we don't want to
   reenter df. */
46 static bool df_in_progress = false;
48 /* True if we are allowed to alter the CFG in this pass. init_dce sets
   this to false for the fast algorithm and to true otherwise. */
49 static bool can_alter_cfg = false;
51 /* Instructions that have been marked but whose dependencies have not
   yet been processed. mark_insn only pushes onto it when the fast
   algorithm is not in use. */
53 static vec<rtx_insn *> worklist;
55 /* Bitmap of instructions marked as needed indexed by INSN_UID. */
56 static sbitmap marked;
58 /* Bitmap obstacks used for block processing by the fast algorithm.
   They are initialized in init_dce and released in fini_dce, in both
   cases only when the fast algorithm is selected. */
59 static bitmap_obstack dce_blocks_bitmap_obstack;
60 static bitmap_obstack dce_tmp_bitmap_obstack;
/* Forward declaration: deletable_insn_p and find_call_stack_args call
   each other. */
62 static bool find_call_stack_args (rtx_call_insn *, bool, bool, bitmap);
64 /* A subroutine for which BODY is part of the instruction being tested;
65 either the top-level pattern, or an element of a PARALLEL. The
66 instruction is known not to be a bare USE or CLOBBER. */
68 static bool
69 deletable_insn_p_1 (rtx body)
71 switch (GET_CODE (body))
73 case PREFETCH:
74 case TRAP_IF:
75 /* The UNSPEC case was added here because the ia-64 claims that
76 USEs do not work after reload and generates UNSPECS rather
77 than USEs. Since dce is run after reload we need to avoid
78 deleting these even if they are dead. If it turns out that
79 USEs really do work after reload, the ia-64 should be
80 changed, and the UNSPEC case can be removed. */
81 case UNSPEC:
82 return false;
84 default:
85 return !volatile_refs_p (body);
90 /* Return true if INSN is a normal instruction that can be deleted by
91 the DCE pass. */
93 static bool
94 deletable_insn_p (rtx_insn *insn, bool fast, bitmap arg_stores)
96 rtx body, x;
97 int i;
98 df_ref def;
100 if (CALL_P (insn)
101 /* We cannot delete calls inside of the recursive dce because
102 this may cause basic blocks to be deleted and this messes up
103 the rest of the stack of optimization passes. */
104 && (!df_in_progress)
105 /* We cannot delete pure or const sibling calls because it is
106 hard to see the result. */
107 && (!SIBLING_CALL_P (insn))
108 /* We can delete dead const or pure calls as long as they do not
109 infinite loop. */
110 && (RTL_CONST_OR_PURE_CALL_P (insn)
111 && !RTL_LOOPING_CONST_OR_PURE_CALL_P (insn)))
112 return find_call_stack_args (as_a <rtx_call_insn *> (insn), false,
113 fast, arg_stores);
115 /* Don't delete jumps, notes and the like. */
116 if (!NONJUMP_INSN_P (insn))
117 return false;
119 /* Don't delete insns that may throw if we cannot do so. */
120 if (!(cfun->can_delete_dead_exceptions && can_alter_cfg)
121 && !insn_nothrow_p (insn))
122 return false;
124 /* If INSN sets a global_reg, leave it untouched. */
125 FOR_EACH_INSN_DEF (def, insn)
126 if (HARD_REGISTER_NUM_P (DF_REF_REGNO (def))
127 && global_regs[DF_REF_REGNO (def)])
128 return false;
129 /* Initialization of pseudo PIC register should never be removed. */
130 else if (DF_REF_REG (def) == pic_offset_table_rtx
131 && REGNO (pic_offset_table_rtx) >= FIRST_PSEUDO_REGISTER)
132 return false;
134 body = PATTERN (insn);
135 switch (GET_CODE (body))
137 case USE:
138 case VAR_LOCATION:
139 return false;
141 case CLOBBER:
142 if (fast)
144 /* A CLOBBER of a dead pseudo register serves no purpose.
145 That is not necessarily true for hard registers until
146 after reload. */
147 x = XEXP (body, 0);
148 return REG_P (x) && (!HARD_REGISTER_P (x) || reload_completed);
150 else
151 /* Because of the way that use-def chains are built, it is not
152 possible to tell if the clobber is dead because it can
153 never be the target of a use-def chain. */
154 return false;
156 case PARALLEL:
157 for (i = XVECLEN (body, 0) - 1; i >= 0; i--)
158 if (!deletable_insn_p_1 (XVECEXP (body, 0, i)))
159 return false;
160 return true;
162 default:
163 return deletable_insn_p_1 (body);
168 /* Return true if INSN has been marked as needed. */
170 static inline int
171 marked_insn_p (rtx_insn *insn)
173 /* Artificial defs are always needed and they do not have an insn.
174 We should never see them here. */
175 gcc_assert (insn);
176 return bitmap_bit_p (marked, INSN_UID (insn));
180 /* If INSN has not yet been marked as needed, mark it now, and add it to
181 the worklist. */
183 static void
184 mark_insn (rtx_insn *insn, bool fast)
186 if (!marked_insn_p (insn))
188 if (!fast)
189 worklist.safe_push (insn);
190 bitmap_set_bit (marked, INSN_UID (insn));
191 if (dump_file)
192 fprintf (dump_file, " Adding insn %d to worklist\n", INSN_UID (insn));
193 if (CALL_P (insn)
194 && !df_in_progress
195 && !SIBLING_CALL_P (insn)
196 && (RTL_CONST_OR_PURE_CALL_P (insn)
197 && !RTL_LOOPING_CONST_OR_PURE_CALL_P (insn)))
198 find_call_stack_args (as_a <rtx_call_insn *> (insn), true, fast, NULL);
203 /* A note_stores callback used by mark_nonreg_stores. DATA is the
204 instruction containing DEST. */
206 static void
207 mark_nonreg_stores_1 (rtx dest, const_rtx pattern, void *data)
209 if (GET_CODE (pattern) != CLOBBER && !REG_P (dest))
210 mark_insn ((rtx_insn *) data, true);
214 /* A note_stores callback used by mark_nonreg_stores. DATA is the
215 instruction containing DEST. */
217 static void
218 mark_nonreg_stores_2 (rtx dest, const_rtx pattern, void *data)
220 if (GET_CODE (pattern) != CLOBBER && !REG_P (dest))
221 mark_insn ((rtx_insn *) data, false);
225 /* Mark INSN if BODY stores to a non-register destination. */
227 static void
228 mark_nonreg_stores (rtx body, rtx_insn *insn, bool fast)
230 if (fast)
231 note_stores (body, mark_nonreg_stores_1, insn);
232 else
233 note_stores (body, mark_nonreg_stores_2, insn);
237 /* Return true if store to MEM, starting OFF bytes from stack pointer,
238 is a call argument store, and clear corresponding bits from SP_BYTES
239 bitmap if it is. */
241 static bool
242 check_argument_store (rtx mem, HOST_WIDE_INT off, HOST_WIDE_INT min_sp_off,
243 HOST_WIDE_INT max_sp_off, bitmap sp_bytes)
245 HOST_WIDE_INT byte;
246 for (byte = off; byte < off + GET_MODE_SIZE (GET_MODE (mem)); byte++)
248 if (byte < min_sp_off
249 || byte >= max_sp_off
250 || !bitmap_clear_bit (sp_bytes, byte - min_sp_off))
251 return false;
253 return true;
257 /* Try to find all stack stores of CALL_INSN arguments if
258 ACCUMULATE_OUTGOING_ARGS. If all stack stores have been found
259 and it is therefore safe to eliminate the call, return true,
260 otherwise return false. This function should be first called
261 with DO_MARK false, and only when the CALL_INSN is actually
262 going to be marked called again with DO_MARK true.

   With DO_MARK false, ARG_STORES must be non-null; it is cleared on
   entry and receives the INSN_UID of every argument store found. It
   is cleared again if the function ends up returning false after the
   backward walk. With DO_MARK true, the stores found are passed to
   mark_insn instead.

   With FAST true, only addresses based directly on the stack pointer
   are accepted. With FAST false, a register address is also accepted
   if the UD chains show it was set to stack pointer plus constant.

   The function works in three steps: compute the range of stack bytes
   used by the arguments, record those bytes in a bitmap, then walk
   backwards from the call clearing the bytes covered by each store. */
264 static bool
265 find_call_stack_args (rtx_call_insn *call_insn, bool do_mark, bool fast,
266 bitmap arg_stores)
268 rtx p;
269 rtx_insn *insn, *prev_insn;
270 bool ret;
271 HOST_WIDE_INT min_sp_off, max_sp_off;
272 bitmap sp_bytes;
274 gcc_assert (CALL_P (call_insn));
/* Without ACCUMULATE_OUTGOING_ARGS there is nothing to look for. */
275 if (!ACCUMULATE_OUTGOING_ARGS)
276 return true;
278 if (!do_mark)
280 gcc_assert (arg_stores);
281 bitmap_clear (arg_stores);
/* Start with an empty range; it stays empty (min >= max) when the call
   has no MEM arguments. */
284 min_sp_off = INTTYPE_MAXIMUM (HOST_WIDE_INT);
285 max_sp_off = 0;
287 /* First determine the minimum and maximum offset from sp for
288 stored arguments. */
289 for (p = CALL_INSN_FUNCTION_USAGE (call_insn); p; p = XEXP (p, 1))
290 if (GET_CODE (XEXP (p, 0)) == USE
291 && MEM_P (XEXP (XEXP (p, 0), 0)))
293 rtx mem = XEXP (XEXP (p, 0), 0), addr;
294 HOST_WIDE_INT off = 0, size;
295 if (!MEM_SIZE_KNOWN_P (mem))
296 return false;
297 size = MEM_SIZE (mem);
298 addr = XEXP (mem, 0);
/* Split a (plus reg const_int) address into base register and offset. */
299 if (GET_CODE (addr) == PLUS
300 && REG_P (XEXP (addr, 0))
301 && CONST_INT_P (XEXP (addr, 1)))
303 off = INTVAL (XEXP (addr, 1));
304 addr = XEXP (addr, 0);
306 if (addr != stack_pointer_rtx)
308 if (!REG_P (addr))
309 return false;
310 /* If not fast, use chains to see if addr wasn't set to
311 sp + offset. */
312 if (!fast)
314 df_ref use;
315 struct df_link *defs;
316 rtx set;
318 FOR_EACH_INSN_USE (use, call_insn)
319 if (rtx_equal_p (addr, DF_REF_REG (use)))
320 break;
322 if (use == NULL)
323 return false;
/* Take the first non-artificial definition reaching this use. */
325 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
326 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
327 break;
329 if (defs == NULL)
330 return false;
332 set = single_set (DF_REF_INSN (defs->ref));
333 if (!set)
334 return false;
336 if (GET_CODE (SET_SRC (set)) != PLUS
337 || XEXP (SET_SRC (set), 0) != stack_pointer_rtx
338 || !CONST_INT_P (XEXP (SET_SRC (set), 1)))
339 return false;
341 off += INTVAL (XEXP (SET_SRC (set), 1));
343 else
344 return false;
346 min_sp_off = MIN (min_sp_off, off);
347 max_sp_off = MAX (max_sp_off, off + size);
/* An empty range means there are no argument bytes to account for. */
350 if (min_sp_off >= max_sp_off)
351 return true;
352 sp_bytes = BITMAP_ALLOC (NULL);
354 /* Set bits in SP_BYTES bitmap for bytes relative to sp + min_sp_off
355 which contain arguments. Checking has been done in the previous
356 loop, which is why the chain lookups below are not re-validated:
   a non-sp base can only get here when FAST is false and the same
   lookups already succeeded above. */
357 for (p = CALL_INSN_FUNCTION_USAGE (call_insn); p; p = XEXP (p, 1))
358 if (GET_CODE (XEXP (p, 0)) == USE
359 && MEM_P (XEXP (XEXP (p, 0), 0)))
361 rtx mem = XEXP (XEXP (p, 0), 0), addr;
362 HOST_WIDE_INT off = 0, byte;
363 addr = XEXP (mem, 0);
364 if (GET_CODE (addr) == PLUS
365 && REG_P (XEXP (addr, 0))
366 && CONST_INT_P (XEXP (addr, 1)))
368 off = INTVAL (XEXP (addr, 1));
369 addr = XEXP (addr, 0);
371 if (addr != stack_pointer_rtx)
373 df_ref use;
374 struct df_link *defs;
375 rtx set;
377 FOR_EACH_INSN_USE (use, call_insn)
378 if (rtx_equal_p (addr, DF_REF_REG (use)))
379 break;
381 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
382 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
383 break;
385 set = single_set (DF_REF_INSN (defs->ref));
386 off += INTVAL (XEXP (SET_SRC (set), 1));
388 for (byte = off; byte < off + MEM_SIZE (mem); byte++)
/* NOTE(review): presumably bitmap_set_bit returns false when the bit
   was already set, so this traps on overlapping argument slots --
   confirm against bitmap.h. */
390 if (!bitmap_set_bit (sp_bytes, byte - min_sp_off))
391 gcc_unreachable ();
395 /* Walk backwards, looking for argument stores. The search stops
396 when seeing another call, sp adjustment or memory store other than
397 argument store. */
398 ret = false;
399 for (insn = PREV_INSN (call_insn); insn; insn = prev_insn)
401 rtx set, mem, addr;
402 HOST_WIDE_INT off;
/* Do not walk past the head of the block containing the call. */
404 if (insn == BB_HEAD (BLOCK_FOR_INSN (call_insn)))
405 prev_insn = NULL;
406 else
407 prev_insn = PREV_INSN (insn);
409 if (CALL_P (insn))
410 break;
412 if (!NONDEBUG_INSN_P (insn))
413 continue;
415 set = single_set (insn);
416 if (!set || SET_DEST (set) == stack_pointer_rtx)
417 break;
/* Insns that do not store to memory are skipped. */
419 if (!MEM_P (SET_DEST (set)))
420 continue;
422 mem = SET_DEST (set);
423 addr = XEXP (mem, 0);
424 off = 0;
425 if (GET_CODE (addr) == PLUS
426 && REG_P (XEXP (addr, 0))
427 && CONST_INT_P (XEXP (addr, 1)))
429 off = INTVAL (XEXP (addr, 1));
430 addr = XEXP (addr, 0);
432 if (addr != stack_pointer_rtx)
434 if (!REG_P (addr))
435 break;
/* Same chain lookup as for the call's own arguments, but any failure
   ends the walk instead of returning. */
436 if (!fast)
438 df_ref use;
439 struct df_link *defs;
440 rtx set;
442 FOR_EACH_INSN_USE (use, insn)
443 if (rtx_equal_p (addr, DF_REF_REG (use)))
444 break;
446 if (use == NULL)
447 break;
449 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
450 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
451 break;
453 if (defs == NULL)
454 break;
456 set = single_set (DF_REF_INSN (defs->ref));
457 if (!set)
458 break;
460 if (GET_CODE (SET_SRC (set)) != PLUS
461 || XEXP (SET_SRC (set), 0) != stack_pointer_rtx
462 || !CONST_INT_P (XEXP (SET_SRC (set), 1)))
463 break;
465 off += INTVAL (XEXP (SET_SRC (set), 1));
467 else
468 break;
/* A store whose mode has size zero, or one that is not entirely made
   of still-outstanding argument bytes, ends the walk. */
471 if (GET_MODE_SIZE (GET_MODE (mem)) == 0
472 || !check_argument_store (mem, off, min_sp_off,
473 max_sp_off, sp_bytes))
474 break;
476 if (!deletable_insn_p (insn, fast, NULL))
477 break;
479 if (do_mark)
480 mark_insn (insn, fast);
481 else
482 bitmap_set_bit (arg_stores, INSN_UID (insn));
/* Success once every argument byte has been matched by a store. */
484 if (bitmap_empty_p (sp_bytes))
486 ret = true;
487 break;
491 BITMAP_FREE (sp_bytes);
/* On failure, forget any stores that were recorded on the way. */
492 if (!ret && arg_stores)
493 bitmap_clear (arg_stores);
495 return ret;
499 /* Remove all REG_EQUAL and REG_EQUIV notes referring to the registers INSN
500 writes to. */
502 static void
503 remove_reg_equal_equiv_notes_for_defs (rtx_insn *insn)
505 df_ref def;
507 FOR_EACH_INSN_DEF (def, insn)
508 remove_reg_equal_equiv_notes_for_regno (DF_REF_REGNO (def));
511 /* Scan all BBs for debug insns and reset those that reference values
512 defined in unmarked insns. */
514 static void
515 reset_unmarked_insns_debug_uses (void)
517 basic_block bb;
518 rtx_insn *insn, *next;
520 FOR_EACH_BB_REVERSE_FN (bb, cfun)
521 FOR_BB_INSNS_REVERSE_SAFE (bb, insn, next)
522 if (DEBUG_INSN_P (insn))
524 df_ref use;
526 FOR_EACH_INSN_USE (use, insn)
528 struct df_link *defs;
529 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
531 rtx_insn *ref_insn;
532 if (DF_REF_IS_ARTIFICIAL (defs->ref))
533 continue;
534 ref_insn = DF_REF_INSN (defs->ref);
535 if (!marked_insn_p (ref_insn))
536 break;
538 if (!defs)
539 continue;
540 /* ??? FIXME could we propagate the values assigned to
541 each of the DEFs? */
542 INSN_VAR_LOCATION_LOC (insn) = gen_rtx_UNKNOWN_VAR_LOC ();
543 df_insn_rescan_debug_internal (insn);
544 break;
549 /* Delete every instruction that hasn't been marked. */
551 static void
552 delete_unmarked_insns (void)
554 basic_block bb;
555 rtx_insn *insn, *next;
556 bool must_clean = false;
558 FOR_EACH_BB_REVERSE_FN (bb, cfun)
559 FOR_BB_INSNS_REVERSE_SAFE (bb, insn, next)
560 if (NONDEBUG_INSN_P (insn))
562 /* Always delete no-op moves. */
563 if (noop_move_p (insn))
566 /* Otherwise rely only on the DCE algorithm. */
567 else if (marked_insn_p (insn))
568 continue;
570 /* Beware that reaching a dbg counter limit here can result
571 in miscompiled file. This occurs when a group of insns
572 must be deleted together, typically because the kept insn
573 depends on the output from the deleted insn. Deleting
574 this insns in reverse order (both at the bb level and
575 when looking at the blocks) minimizes this, but does not
576 eliminate it, since it is possible for the using insn to
577 be top of a block and the producer to be at the bottom of
578 the block. However, in most cases this will only result
579 in an uninitialized use of an insn that is dead anyway.
581 However, there is one rare case that will cause a
582 miscompile: deletion of non-looping pure and constant
583 calls on a machine where ACCUMULATE_OUTGOING_ARGS is true.
584 In this case it is possible to remove the call, but leave
585 the argument pushes to the stack. Because of the changes
586 to the stack pointer, this will almost always lead to a
587 miscompile. */
588 if (!dbg_cnt (dce))
589 continue;
591 if (crtl->shrink_wrapped_separate
592 && find_reg_note (insn, REG_CFA_RESTORE, NULL))
594 if (dump_file)
595 fprintf (dump_file, "DCE: NOT deleting insn %d, it's a "
596 "callee-save restore\n", INSN_UID (insn));
597 continue;
600 if (dump_file)
601 fprintf (dump_file, "DCE: Deleting insn %d\n", INSN_UID (insn));
603 /* Before we delete the insn we have to remove the REG_EQUAL notes
604 for the destination regs in order to avoid dangling notes. */
605 remove_reg_equal_equiv_notes_for_defs (insn);
607 /* If a pure or const call is deleted, this may make the cfg
608 have unreachable blocks. We rememeber this and call
609 delete_unreachable_blocks at the end. */
610 if (CALL_P (insn))
611 must_clean = true;
613 /* Now delete the insn. */
614 delete_insn_and_edges (insn);
617 /* Deleted a pure or const call. */
618 if (must_clean)
619 delete_unreachable_blocks ();
623 /* Go through the instructions and mark those whose necessity is not
624 dependent on inter-instruction information. Make sure all other
625 instructions are not marked. */
627 static void
628 prescan_insns_for_dce (bool fast)
630 basic_block bb;
631 rtx_insn *insn, *prev;
632 bitmap arg_stores = NULL;
634 if (dump_file)
635 fprintf (dump_file, "Finding needed instructions:\n");
637 if (!df_in_progress && ACCUMULATE_OUTGOING_ARGS)
638 arg_stores = BITMAP_ALLOC (NULL);
640 FOR_EACH_BB_FN (bb, cfun)
642 FOR_BB_INSNS_REVERSE_SAFE (bb, insn, prev)
643 if (NONDEBUG_INSN_P (insn))
645 /* Don't mark argument stores now. They will be marked
646 if needed when the associated CALL is marked. */
647 if (arg_stores && bitmap_bit_p (arg_stores, INSN_UID (insn)))
648 continue;
649 if (deletable_insn_p (insn, fast, arg_stores))
650 mark_nonreg_stores (PATTERN (insn), insn, fast);
651 else
652 mark_insn (insn, fast);
654 /* find_call_stack_args only looks at argument stores in the
655 same bb. */
656 if (arg_stores)
657 bitmap_clear (arg_stores);
660 if (arg_stores)
661 BITMAP_FREE (arg_stores);
663 if (dump_file)
664 fprintf (dump_file, "Finished finding needed instructions:\n");
668 /* UD-based DCE routines. */
670 /* Mark instructions that define artificially-used registers, such as
671 the frame pointer and the stack pointer. */
673 static void
674 mark_artificial_uses (void)
676 basic_block bb;
677 struct df_link *defs;
678 df_ref use;
680 FOR_ALL_BB_FN (bb, cfun)
681 FOR_EACH_ARTIFICIAL_USE (use, bb->index)
682 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
683 if (!DF_REF_IS_ARTIFICIAL (defs->ref))
684 mark_insn (DF_REF_INSN (defs->ref), false);
688 /* Mark every instruction that defines a register value that INSN uses. */
690 static void
691 mark_reg_dependencies (rtx_insn *insn)
693 struct df_link *defs;
694 df_ref use;
696 if (DEBUG_INSN_P (insn))
697 return;
699 FOR_EACH_INSN_USE (use, insn)
701 if (dump_file)
703 fprintf (dump_file, "Processing use of ");
704 print_simple_rtl (dump_file, DF_REF_REG (use));
705 fprintf (dump_file, " in insn %d:\n", INSN_UID (insn));
707 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
708 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
709 mark_insn (DF_REF_INSN (defs->ref), false);
714 /* Initialize global variables for a new DCE pass. */
716 static void
717 init_dce (bool fast)
719 if (!df_in_progress)
721 if (!fast)
723 df_set_flags (DF_RD_PRUNE_DEAD_DEFS);
724 df_chain_add_problem (DF_UD_CHAIN);
726 df_analyze ();
729 if (dump_file)
730 df_dump (dump_file);
732 if (fast)
734 bitmap_obstack_initialize (&dce_blocks_bitmap_obstack);
735 bitmap_obstack_initialize (&dce_tmp_bitmap_obstack);
736 can_alter_cfg = false;
738 else
739 can_alter_cfg = true;
741 marked = sbitmap_alloc (get_max_uid () + 1);
742 bitmap_clear (marked);
746 /* Free the data allocated by init_dce. */
748 static void
749 fini_dce (bool fast)
751 sbitmap_free (marked);
753 if (fast)
755 bitmap_obstack_release (&dce_blocks_bitmap_obstack);
756 bitmap_obstack_release (&dce_tmp_bitmap_obstack);
761 /* UD-chain based DCE. */
763 static unsigned int
764 rest_of_handle_ud_dce (void)
766 rtx_insn *insn;
768 init_dce (false);
770 prescan_insns_for_dce (false);
771 mark_artificial_uses ();
772 while (worklist.length () > 0)
774 insn = worklist.pop ();
775 mark_reg_dependencies (insn);
777 worklist.release ();
779 if (MAY_HAVE_DEBUG_INSNS)
780 reset_unmarked_insns_debug_uses ();
782 /* Before any insns are deleted, we must remove the chains since
783 they are not bidirectional. */
784 df_remove_problem (df_chain);
785 delete_unmarked_insns ();
787 fini_dce (false);
788 return 0;
792 namespace {
794 const pass_data pass_data_ud_rtl_dce =
796 RTL_PASS, /* type */
797 "ud_dce", /* name */
798 OPTGROUP_NONE, /* optinfo_flags */
799 TV_DCE, /* tv_id */
800 0, /* properties_required */
801 0, /* properties_provided */
802 0, /* properties_destroyed */
803 0, /* todo_flags_start */
804 TODO_df_finish, /* todo_flags_finish */
807 class pass_ud_rtl_dce : public rtl_opt_pass
809 public:
810 pass_ud_rtl_dce (gcc::context *ctxt)
811 : rtl_opt_pass (pass_data_ud_rtl_dce, ctxt)
814 /* opt_pass methods: */
815 virtual bool gate (function *)
817 return optimize > 1 && flag_dce && dbg_cnt (dce_ud);
820 virtual unsigned int execute (function *)
822 return rest_of_handle_ud_dce ();
825 }; // class pass_ud_rtl_dce
827 } // anon namespace
829 rtl_opt_pass *
830 make_pass_ud_rtl_dce (gcc::context *ctxt)
832 return new pass_ud_rtl_dce (ctxt);
836 /* -------------------------------------------------------------------------
837 Fast DCE functions
838 ------------------------------------------------------------------------- */
840 /* Process basic block BB using the word-level LR problem
   (df_word_lr). Return true if the live_in set has
841 changed. REDO_OUT is true if the info at the bottom of the block
842 needs to be recalculated before starting. Track global substitution
   of uses of dead pseudos
844 in debug insns using GLOBAL_DEBUG. */
846 static bool
847 word_dce_process_block (basic_block bb, bool redo_out,
848 struct dead_debug_global *global_debug)
850 bitmap local_live = BITMAP_ALLOC (&dce_tmp_bitmap_obstack);
851 rtx_insn *insn;
852 bool block_changed;
853 struct dead_debug_local debug;
855 if (redo_out)
857 /* Need to redo the live_out set of this block when one of
858 the succs of this block has had a change in its live in
859 set. */
860 edge e;
861 edge_iterator ei;
862 df_confluence_function_n con_fun_n = df_word_lr->problem->con_fun_n;
863 bitmap_clear (DF_WORD_LR_OUT (bb));
864 FOR_EACH_EDGE (e, ei, bb->succs)
865 (*con_fun_n) (e);
868 if (dump_file)
870 fprintf (dump_file, "processing block %d live out = ", bb->index);
871 df_print_word_regset (dump_file, DF_WORD_LR_OUT (bb));
/* Simulate the block backwards, starting from its live-out set. */
874 bitmap_copy (local_live, DF_WORD_LR_OUT (bb));
875 dead_debug_local_init (&debug, NULL, global_debug);
877 FOR_BB_INSNS_REVERSE (bb, insn)
878 if (DEBUG_INSN_P (insn))
880 df_ref use;
/* Record debug uses of pseudos whose mode is two words wide and for
   which neither bit 2 * REGNO nor bit 2 * REGNO + 1 is live. */
881 FOR_EACH_INSN_USE (use, insn)
882 if (DF_REF_REGNO (use) >= FIRST_PSEUDO_REGISTER
883 && (GET_MODE_SIZE (GET_MODE (DF_REF_REAL_REG (use)))
884 == 2 * UNITS_PER_WORD)
885 && !bitmap_bit_p (local_live, 2 * DF_REF_REGNO (use))
886 && !bitmap_bit_p (local_live, 2 * DF_REF_REGNO (use) + 1))
887 dead_debug_add (&debug, use, DF_REF_REGNO (use));
889 else if (INSN_P (insn))
891 bool any_changed;
893 /* No matter if the instruction is needed or not, we remove
894 any regno in the defs from the live set. The insn is marked
   as needed when df_word_lr_simulate_defs returns true. */
895 any_changed = df_word_lr_simulate_defs (insn, local_live);
896 if (any_changed)
897 mark_insn (insn, true);
899 /* On the other hand, we do not allow the dead uses to set
900 anything in local_live. */
901 if (marked_insn_p (insn))
902 df_word_lr_simulate_uses (insn, local_live);
904 /* Insert debug temps for dead REGs used in subsequent debug
905 insns. We may have to emit a debug temp even if the insn
906 was marked, in case the debug use was after the point of
907 death. */
908 if (debug.used && !bitmap_empty_p (debug.used))
910 df_ref def;
912 FOR_EACH_INSN_DEF (def, insn)
913 dead_debug_insert_temp (&debug, DF_REF_REGNO (def), insn,
914 marked_insn_p (insn)
915 && !control_flow_insn_p (insn)
916 ? DEBUG_TEMP_AFTER_WITH_REG_FORCE
917 : DEBUG_TEMP_BEFORE_WITH_VALUE);
920 if (dump_file)
922 fprintf (dump_file, "finished processing insn %d live out = ",
923 INSN_UID (insn));
924 df_print_word_regset (dump_file, local_live);
/* Store the new live-in set if it differs from the recorded one. */
928 block_changed = !bitmap_equal_p (local_live, DF_WORD_LR_IN (bb));
929 if (block_changed)
930 bitmap_copy (DF_WORD_LR_IN (bb), local_live);
932 dead_debug_local_finish (&debug, NULL);
933 BITMAP_FREE (local_live);
934 return block_changed;
938 /* Process basic block BB using the LR problem (df_lr). Return true
   if the live_in set has
939 changed. REDO_OUT is true if the info at the bottom of the block
940 needs to be recalculated before starting. AU is the proper set of
941 artificial uses; a register in AU is treated as live at every insn.
   Track global substitution of uses of dead pseudos
942 in debug insns using GLOBAL_DEBUG. */
944 static bool
945 dce_process_block (basic_block bb, bool redo_out, bitmap au,
946 struct dead_debug_global *global_debug)
948 bitmap local_live = BITMAP_ALLOC (&dce_tmp_bitmap_obstack);
949 rtx_insn *insn;
950 bool block_changed;
951 df_ref def;
952 struct dead_debug_local debug;
954 if (redo_out)
956 /* Need to redo the live_out set of this block when one of
957 the succs of this block has had a change in its live in
958 set. */
959 edge e;
960 edge_iterator ei;
961 df_confluence_function_n con_fun_n = df_lr->problem->con_fun_n;
962 bitmap_clear (DF_LR_OUT (bb));
963 FOR_EACH_EDGE (e, ei, bb->succs)
964 (*con_fun_n) (e);
967 if (dump_file)
969 fprintf (dump_file, "processing block %d lr out = ", bb->index);
970 df_print_regset (dump_file, DF_LR_OUT (bb));
/* Simulate the block backwards, starting from its live-out set. */
973 bitmap_copy (local_live, DF_LR_OUT (bb));
975 df_simulate_initialize_backwards (bb, local_live);
976 dead_debug_local_init (&debug, NULL, global_debug);
978 FOR_BB_INSNS_REVERSE (bb, insn)
979 if (DEBUG_INSN_P (insn))
981 df_ref use;
/* Record debug uses of registers that are neither live here nor in AU. */
982 FOR_EACH_INSN_USE (use, insn)
983 if (!bitmap_bit_p (local_live, DF_REF_REGNO (use))
984 && !bitmap_bit_p (au, DF_REF_REGNO (use)))
985 dead_debug_add (&debug, use, DF_REF_REGNO (use));
987 else if (INSN_P (insn))
989 bool needed = marked_insn_p (insn);
991 /* The insn is needed if there is someone who uses the output. */
992 if (!needed)
993 FOR_EACH_INSN_DEF (def, insn)
994 if (bitmap_bit_p (local_live, DF_REF_REGNO (def))
995 || bitmap_bit_p (au, DF_REF_REGNO (def)))
997 needed = true;
998 mark_insn (insn, true);
999 break;
1002 /* No matter if the instruction is needed or not, we remove
1003 any regno in the defs from the live set. */
1004 df_simulate_defs (insn, local_live);
1006 /* On the other hand, we do not allow the dead uses to set
1007 anything in local_live. */
1008 if (needed)
1009 df_simulate_uses (insn, local_live);
1011 /* Insert debug temps for dead REGs used in subsequent debug
1012 insns. We may have to emit a debug temp even if the insn
1013 was marked, in case the debug use was after the point of
1014 death. */
1015 if (debug.used && !bitmap_empty_p (debug.used))
1016 FOR_EACH_INSN_DEF (def, insn)
1017 dead_debug_insert_temp (&debug, DF_REF_REGNO (def), insn,
1018 needed && !control_flow_insn_p (insn)
1019 ? DEBUG_TEMP_AFTER_WITH_REG_FORCE
1020 : DEBUG_TEMP_BEFORE_WITH_VALUE);
1023 dead_debug_local_finish (&debug, NULL);
1024 df_simulate_finalize_backwards (bb, local_live);
/* Store the new live-in set if it differs from the recorded one. */
1026 block_changed = !bitmap_equal_p (local_live, DF_LR_IN (bb));
1027 if (block_changed)
1028 bitmap_copy (DF_LR_IN (bb), local_live);
1030 BITMAP_FREE (local_live);
1031 return block_changed;
1035 /* Perform fast DCE once initialization is done. If WORD_LEVEL is
1036 true, use the word level dce, otherwise do it at the pseudo
1037 level. The blocks are processed in df's backward postorder, and
   the whole analysis is repeated for as long as a change reaches a
   block that had already been processed in the current round. */
1039 static void
1040 fast_dce (bool word_level)
1042 int *postorder = df_get_postorder (DF_BACKWARD);
1043 int n_blocks = df_get_n_blocks (DF_BACKWARD);
1044 /* The set of blocks that have been seen on this iteration. */
1045 bitmap processed = BITMAP_ALLOC (&dce_blocks_bitmap_obstack);
1046 /* The set of blocks that need to have the out vectors reset because
1047 the in of one of their successors has changed. */
1048 bitmap redo_out = BITMAP_ALLOC (&dce_blocks_bitmap_obstack);
1049 bitmap all_blocks = BITMAP_ALLOC (&dce_blocks_bitmap_obstack);
1050 bool global_changed = true;
1052 /* These regs are considered always live so if they end up dying
1053 because of some def, we need to bring them back again. Calling
1054 df_simulate_fixup_sets has the disadvantage of calling
1055 bb_has_eh_pred once per insn, so we cache the information
1056 here. */
1057 bitmap au = &df->regular_block_artificial_uses;
1058 bitmap au_eh = &df->eh_block_artificial_uses;
1059 int i;
1060 struct dead_debug_global global_debug;
1062 prescan_insns_for_dce (true);
1064 for (i = 0; i < n_blocks; i++)
1065 bitmap_set_bit (all_blocks, postorder[i]);
1067 dead_debug_global_init (&global_debug, NULL);
1069 while (global_changed)
1071 global_changed = false;
1073 for (i = 0; i < n_blocks; i++)
1075 int index = postorder[i];
1076 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, index);
1077 bool local_changed;
/* The fixed blocks (index below NUM_FIXED_BLOCKS) are only recorded as
   processed. */
1079 if (index < NUM_FIXED_BLOCKS)
1081 bitmap_set_bit (processed, index);
1082 continue;
1085 if (word_level)
1086 local_changed
1087 = word_dce_process_block (bb, bitmap_bit_p (redo_out, index),
1088 &global_debug);
1089 else
1090 local_changed
1091 = dce_process_block (bb, bitmap_bit_p (redo_out, index),
1092 bb_has_eh_pred (bb) ? au_eh : au,
1093 &global_debug);
1094 bitmap_set_bit (processed, index);
1096 if (local_changed)
1098 edge e;
1099 edge_iterator ei;
1100 FOR_EACH_EDGE (e, ei, bb->preds)
1101 if (bitmap_bit_p (processed, e->src->index))
1102 /* Be tricky about when we need to iterate the
1103 analysis. We only have to redo the analysis if the
1104 bitmaps change at the top of a block that is the
1105 entry to a loop. */
1106 global_changed = true;
1107 else
1108 bitmap_set_bit (redo_out, e->src->index);
1112 if (global_changed)
1114 /* Turn off the RUN_DCE flag to prevent recursive calls to
1115 dce. */
1116 int old_flag = df_clear_flags (DF_LR_RUN_DCE);
1118 /* So something was deleted that requires a redo. Do it on
1119 the cheap. */
1120 delete_unmarked_insns ();
1121 bitmap_clear (marked);
1122 bitmap_clear (processed);
1123 bitmap_clear (redo_out);
1125 /* We do not need to rescan any instructions. We only need
1126 to redo the dataflow equations for the blocks that had a
1127 change at the top of the block. Then we need to redo the
1128 iteration. */
1129 if (word_level)
1130 df_analyze_problem (df_word_lr, all_blocks, postorder, n_blocks);
1131 else
1132 df_analyze_problem (df_lr, all_blocks, postorder, n_blocks);
/* Restore DF_LR_RUN_DCE if it was set before. */
1134 if (old_flag & DF_LR_RUN_DCE)
1135 df_set_flags (DF_LR_RUN_DCE);
/* MARKED was cleared above, so the needed insns must be found again. */
1137 prescan_insns_for_dce (true);
1141 dead_debug_global_finish (&global_debug, NULL);
1143 delete_unmarked_insns ();
1145 BITMAP_FREE (processed);
1146 BITMAP_FREE (redo_out);
1147 BITMAP_FREE (all_blocks);
1151 /* Fast register level DCE. */
1153 static unsigned int
1154 rest_of_handle_fast_dce (void)
1156 init_dce (true);
1157 fast_dce (false);
1158 fini_dce (true);
1159 return 0;
1163 /* Fast byte level DCE. */
1165 void
1166 run_word_dce (void)
1168 int old_flags;
1170 if (!flag_dce)
1171 return;
1173 timevar_push (TV_DCE);
1174 old_flags = df_clear_flags (DF_DEFER_INSN_RESCAN + DF_NO_INSN_RESCAN);
1175 df_word_lr_add_problem ();
1176 init_dce (true);
1177 fast_dce (true);
1178 fini_dce (true);
1179 df_set_flags (old_flags);
1180 timevar_pop (TV_DCE);
1184 /* This is an internal call that is used by the df live register
1185 problem to run fast dce as a side effect of creating the live
1186 information. The stack is organized so that the lr problem is run,
1187 this pass is run, which updates the live info and the df scanning
1188 info, and then returns to allow the rest of the problems to be run.
1190 This can be called by elsewhere but it will not update the bit
1191 vectors for any other problems than LR. */
1193 void
1194 run_fast_df_dce (void)
1196 if (flag_dce)
1198 /* If dce is able to delete something, it has to happen
1199 immediately. Otherwise there will be problems handling the
1200 eq_notes. */
1201 int old_flags =
1202 df_clear_flags (DF_DEFER_INSN_RESCAN + DF_NO_INSN_RESCAN);
1204 df_in_progress = true;
1205 rest_of_handle_fast_dce ();
1206 df_in_progress = false;
1208 df_set_flags (old_flags);
1213 /* Run a fast DCE pass. */
1215 void
1216 run_fast_dce (void)
1218 if (flag_dce)
1219 rest_of_handle_fast_dce ();
1223 namespace {
1225 const pass_data pass_data_fast_rtl_dce =
1227 RTL_PASS, /* type */
1228 "rtl_dce", /* name */
1229 OPTGROUP_NONE, /* optinfo_flags */
1230 TV_DCE, /* tv_id */
1231 0, /* properties_required */
1232 0, /* properties_provided */
1233 0, /* properties_destroyed */
1234 0, /* todo_flags_start */
1235 TODO_df_finish, /* todo_flags_finish */
1238 class pass_fast_rtl_dce : public rtl_opt_pass
1240 public:
1241 pass_fast_rtl_dce (gcc::context *ctxt)
1242 : rtl_opt_pass (pass_data_fast_rtl_dce, ctxt)
1245 /* opt_pass methods: */
1246 virtual bool gate (function *)
1248 return optimize > 0 && flag_dce && dbg_cnt (dce_fast);
1251 virtual unsigned int execute (function *)
1253 return rest_of_handle_fast_dce ();
1256 }; // class pass_fast_rtl_dce
1258 } // anon namespace
1260 rtl_opt_pass *
1261 make_pass_fast_rtl_dce (gcc::context *ctxt)
1263 return new pass_fast_rtl_dce (ctxt);