PR tree-optimization/66718
[official-gcc.git] / gcc / dce.c
blob0f7d35e7182f07e9df47db97cf9d8573abcfb292
1 /* RTL dead code elimination.
2 Copyright (C) 2005-2015 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "tm.h"
24 #include "rtl.h"
25 #include "alias.h"
26 #include "symtab.h"
27 #include "tree.h"
28 #include "regs.h"
29 #include "hard-reg-set.h"
30 #include "flags.h"
31 #include "except.h"
32 #include "dominance.h"
33 #include "cfg.h"
34 #include "cfgrtl.h"
35 #include "cfgbuild.h"
36 #include "cfgcleanup.h"
37 #include "predict.h"
38 #include "basic-block.h"
39 #include "df.h"
40 #include "cselib.h"
41 #include "dce.h"
42 #include "valtrack.h"
43 #include "tree-pass.h"
44 #include "dbgcnt.h"
45 #include "tm_p.h"
46 #include "emit-rtl.h" /* FIXME: Can go away once crtl is moved to rtl.h. */
49 /* -------------------------------------------------------------------------
50 Core mark/delete routines
51 ------------------------------------------------------------------------- */
53 /* True if we are invoked while the df engine is running; in this case,
54 we don't want to reenter it. */
55 static bool df_in_progress = false;
57 /* True if we are allowed to alter the CFG in this pass. */
58 static bool can_alter_cfg = false;
60 /* Instructions that have been marked but whose dependencies have not
61 yet been processed. */
62 static vec<rtx_insn *> worklist;
64 /* Bitmap of instructions marked as needed indexed by INSN_UID. */
65 static sbitmap marked;
67 /* Bitmap obstacks used for block processing by the fast algorithm. */
68 static bitmap_obstack dce_blocks_bitmap_obstack;
69 static bitmap_obstack dce_tmp_bitmap_obstack;
71 static bool find_call_stack_args (rtx_call_insn *, bool, bool, bitmap);
73 /* A subroutine for which BODY is part of the instruction being tested;
74 either the top-level pattern, or an element of a PARALLEL. The
75 instruction is known not to be a bare USE or CLOBBER. */
77 static bool
78 deletable_insn_p_1 (rtx body)
80 switch (GET_CODE (body))
82 case PREFETCH:
83 case TRAP_IF:
84 /* The UNSPEC case was added here because the ia-64 claims that
85 USEs do not work after reload and generates UNSPECS rather
86 than USEs. Since dce is run after reload we need to avoid
87 deleting these even if they are dead. If it turns out that
88 USEs really do work after reload, the ia-64 should be
89 changed, and the UNSPEC case can be removed. */
90 case UNSPEC:
91 return false;
93 default:
94 return !volatile_refs_p (body);
99 /* Return true if INSN is a normal instruction that can be deleted by
100 the DCE pass. */
102 static bool
103 deletable_insn_p (rtx_insn *insn, bool fast, bitmap arg_stores)
105 rtx body, x;
106 int i;
107 df_ref def;
109 if (CALL_P (insn)
110 /* We cannot delete calls inside of the recursive dce because
111 this may cause basic blocks to be deleted and this messes up
112 the rest of the stack of optimization passes. */
113 && (!df_in_progress)
114 /* We cannot delete pure or const sibling calls because it is
115 hard to see the result. */
116 && (!SIBLING_CALL_P (insn))
117 /* We can delete dead const or pure calls as long as they do not
118 infinite loop. */
119 && (RTL_CONST_OR_PURE_CALL_P (insn)
120 && !RTL_LOOPING_CONST_OR_PURE_CALL_P (insn)))
121 return find_call_stack_args (as_a <rtx_call_insn *> (insn), false,
122 fast, arg_stores);
124 /* Don't delete jumps, notes and the like. */
125 if (!NONJUMP_INSN_P (insn))
126 return false;
128 /* Don't delete insns that may throw if we cannot do so. */
129 if (!(cfun->can_delete_dead_exceptions && can_alter_cfg)
130 && !insn_nothrow_p (insn))
131 return false;
133 /* If INSN sets a global_reg, leave it untouched. */
134 FOR_EACH_INSN_DEF (def, insn)
135 if (HARD_REGISTER_NUM_P (DF_REF_REGNO (def))
136 && global_regs[DF_REF_REGNO (def)])
137 return false;
138 /* Initialization of pseudo PIC register should never be removed. */
139 else if (DF_REF_REG (def) == pic_offset_table_rtx
140 && REGNO (pic_offset_table_rtx) >= FIRST_PSEUDO_REGISTER)
141 return false;
143 body = PATTERN (insn);
144 switch (GET_CODE (body))
146 case USE:
147 case VAR_LOCATION:
148 return false;
150 case CLOBBER:
151 if (fast)
153 /* A CLOBBER of a dead pseudo register serves no purpose.
154 That is not necessarily true for hard registers until
155 after reload. */
156 x = XEXP (body, 0);
157 return REG_P (x) && (!HARD_REGISTER_P (x) || reload_completed);
159 else
160 /* Because of the way that use-def chains are built, it is not
161 possible to tell if the clobber is dead because it can
162 never be the target of a use-def chain. */
163 return false;
165 case PARALLEL:
166 for (i = XVECLEN (body, 0) - 1; i >= 0; i--)
167 if (!deletable_insn_p_1 (XVECEXP (body, 0, i)))
168 return false;
169 return true;
171 default:
172 return deletable_insn_p_1 (body);
177 /* Return true if INSN has been marked as needed. */
179 static inline int
180 marked_insn_p (rtx_insn *insn)
182 /* Artificial defs are always needed and they do not have an insn.
183 We should never see them here. */
184 gcc_assert (insn);
185 return bitmap_bit_p (marked, INSN_UID (insn));
189 /* If INSN has not yet been marked as needed, mark it now, and add it to
190 the worklist. */
192 static void
193 mark_insn (rtx_insn *insn, bool fast)
195 if (!marked_insn_p (insn))
197 if (!fast)
198 worklist.safe_push (insn);
199 bitmap_set_bit (marked, INSN_UID (insn));
200 if (dump_file)
201 fprintf (dump_file, " Adding insn %d to worklist\n", INSN_UID (insn));
202 if (CALL_P (insn)
203 && !df_in_progress
204 && !SIBLING_CALL_P (insn)
205 && (RTL_CONST_OR_PURE_CALL_P (insn)
206 && !RTL_LOOPING_CONST_OR_PURE_CALL_P (insn)))
207 find_call_stack_args (as_a <rtx_call_insn *> (insn), true, fast, NULL);
212 /* A note_stores callback used by mark_nonreg_stores. DATA is the
213 instruction containing DEST. */
215 static void
216 mark_nonreg_stores_1 (rtx dest, const_rtx pattern, void *data)
218 if (GET_CODE (pattern) != CLOBBER && !REG_P (dest))
219 mark_insn ((rtx_insn *) data, true);
223 /* A note_stores callback used by mark_nonreg_stores. DATA is the
224 instruction containing DEST. */
226 static void
227 mark_nonreg_stores_2 (rtx dest, const_rtx pattern, void *data)
229 if (GET_CODE (pattern) != CLOBBER && !REG_P (dest))
230 mark_insn ((rtx_insn *) data, false);
234 /* Mark INSN if BODY stores to a non-register destination. */
236 static void
237 mark_nonreg_stores (rtx body, rtx_insn *insn, bool fast)
239 if (fast)
240 note_stores (body, mark_nonreg_stores_1, insn);
241 else
242 note_stores (body, mark_nonreg_stores_2, insn);
246 /* Return true if store to MEM, starting OFF bytes from stack pointer,
247 is a call argument store, and clear corresponding bits from SP_BYTES
248 bitmap if it is. */
250 static bool
251 check_argument_store (rtx mem, HOST_WIDE_INT off, HOST_WIDE_INT min_sp_off,
252 HOST_WIDE_INT max_sp_off, bitmap sp_bytes)
254 HOST_WIDE_INT byte;
255 for (byte = off; byte < off + GET_MODE_SIZE (GET_MODE (mem)); byte++)
257 if (byte < min_sp_off
258 || byte >= max_sp_off
259 || !bitmap_clear_bit (sp_bytes, byte - min_sp_off))
260 return false;
262 return true;
266 /* Try to find all stack stores of CALL_INSN arguments if
267 ACCUMULATE_OUTGOING_ARGS. If all stack stores have been found
268 and it is therefore safe to eliminate the call, return true,
269 otherwise return false. This function should be first called
270 with DO_MARK false, and only when the CALL_INSN is actually
271 going to be marked called again with DO_MARK true. */
273 static bool
274 find_call_stack_args (rtx_call_insn *call_insn, bool do_mark, bool fast,
275 bitmap arg_stores)
277 rtx p;
278 rtx_insn *insn, *prev_insn;
279 bool ret;
280 HOST_WIDE_INT min_sp_off, max_sp_off;
281 bitmap sp_bytes;
283 gcc_assert (CALL_P (call_insn));
284 if (!ACCUMULATE_OUTGOING_ARGS)
285 return true;
287 if (!do_mark)
289 gcc_assert (arg_stores);
290 bitmap_clear (arg_stores);
293 min_sp_off = INTTYPE_MAXIMUM (HOST_WIDE_INT);
294 max_sp_off = 0;
296 /* First determine the minimum and maximum offset from sp for
297 stored arguments. */
298 for (p = CALL_INSN_FUNCTION_USAGE (call_insn); p; p = XEXP (p, 1))
299 if (GET_CODE (XEXP (p, 0)) == USE
300 && MEM_P (XEXP (XEXP (p, 0), 0)))
302 rtx mem = XEXP (XEXP (p, 0), 0), addr;
303 HOST_WIDE_INT off = 0, size;
304 if (!MEM_SIZE_KNOWN_P (mem))
305 return false;
306 size = MEM_SIZE (mem);
307 addr = XEXP (mem, 0);
308 if (GET_CODE (addr) == PLUS
309 && REG_P (XEXP (addr, 0))
310 && CONST_INT_P (XEXP (addr, 1)))
312 off = INTVAL (XEXP (addr, 1));
313 addr = XEXP (addr, 0);
315 if (addr != stack_pointer_rtx)
317 if (!REG_P (addr))
318 return false;
319 /* If not fast, use chains to see if addr wasn't set to
320 sp + offset. */
321 if (!fast)
323 df_ref use;
324 struct df_link *defs;
325 rtx set;
327 FOR_EACH_INSN_USE (use, call_insn)
328 if (rtx_equal_p (addr, DF_REF_REG (use)))
329 break;
331 if (use == NULL)
332 return false;
334 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
335 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
336 break;
338 if (defs == NULL)
339 return false;
341 set = single_set (DF_REF_INSN (defs->ref));
342 if (!set)
343 return false;
345 if (GET_CODE (SET_SRC (set)) != PLUS
346 || XEXP (SET_SRC (set), 0) != stack_pointer_rtx
347 || !CONST_INT_P (XEXP (SET_SRC (set), 1)))
348 return false;
350 off += INTVAL (XEXP (SET_SRC (set), 1));
352 else
353 return false;
355 min_sp_off = MIN (min_sp_off, off);
356 max_sp_off = MAX (max_sp_off, off + size);
359 if (min_sp_off >= max_sp_off)
360 return true;
361 sp_bytes = BITMAP_ALLOC (NULL);
363 /* Set bits in SP_BYTES bitmap for bytes relative to sp + min_sp_off
364 which contain arguments. Checking has been done in the previous
365 loop. */
366 for (p = CALL_INSN_FUNCTION_USAGE (call_insn); p; p = XEXP (p, 1))
367 if (GET_CODE (XEXP (p, 0)) == USE
368 && MEM_P (XEXP (XEXP (p, 0), 0)))
370 rtx mem = XEXP (XEXP (p, 0), 0), addr;
371 HOST_WIDE_INT off = 0, byte;
372 addr = XEXP (mem, 0);
373 if (GET_CODE (addr) == PLUS
374 && REG_P (XEXP (addr, 0))
375 && CONST_INT_P (XEXP (addr, 1)))
377 off = INTVAL (XEXP (addr, 1));
378 addr = XEXP (addr, 0);
380 if (addr != stack_pointer_rtx)
382 df_ref use;
383 struct df_link *defs;
384 rtx set;
386 FOR_EACH_INSN_USE (use, call_insn)
387 if (rtx_equal_p (addr, DF_REF_REG (use)))
388 break;
390 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
391 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
392 break;
394 set = single_set (DF_REF_INSN (defs->ref));
395 off += INTVAL (XEXP (SET_SRC (set), 1));
397 for (byte = off; byte < off + MEM_SIZE (mem); byte++)
399 if (!bitmap_set_bit (sp_bytes, byte - min_sp_off))
400 gcc_unreachable ();
404 /* Walk backwards, looking for argument stores. The search stops
405 when seeing another call, sp adjustment or memory store other than
406 argument store. */
407 ret = false;
408 for (insn = PREV_INSN (call_insn); insn; insn = prev_insn)
410 rtx set, mem, addr;
411 HOST_WIDE_INT off;
413 if (insn == BB_HEAD (BLOCK_FOR_INSN (call_insn)))
414 prev_insn = NULL;
415 else
416 prev_insn = PREV_INSN (insn);
418 if (CALL_P (insn))
419 break;
421 if (!NONDEBUG_INSN_P (insn))
422 continue;
424 set = single_set (insn);
425 if (!set || SET_DEST (set) == stack_pointer_rtx)
426 break;
428 if (!MEM_P (SET_DEST (set)))
429 continue;
431 mem = SET_DEST (set);
432 addr = XEXP (mem, 0);
433 off = 0;
434 if (GET_CODE (addr) == PLUS
435 && REG_P (XEXP (addr, 0))
436 && CONST_INT_P (XEXP (addr, 1)))
438 off = INTVAL (XEXP (addr, 1));
439 addr = XEXP (addr, 0);
441 if (addr != stack_pointer_rtx)
443 if (!REG_P (addr))
444 break;
445 if (!fast)
447 df_ref use;
448 struct df_link *defs;
449 rtx set;
451 FOR_EACH_INSN_USE (use, insn)
452 if (rtx_equal_p (addr, DF_REF_REG (use)))
453 break;
455 if (use == NULL)
456 break;
458 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
459 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
460 break;
462 if (defs == NULL)
463 break;
465 set = single_set (DF_REF_INSN (defs->ref));
466 if (!set)
467 break;
469 if (GET_CODE (SET_SRC (set)) != PLUS
470 || XEXP (SET_SRC (set), 0) != stack_pointer_rtx
471 || !CONST_INT_P (XEXP (SET_SRC (set), 1)))
472 break;
474 off += INTVAL (XEXP (SET_SRC (set), 1));
476 else
477 break;
480 if (GET_MODE_SIZE (GET_MODE (mem)) == 0
481 || !check_argument_store (mem, off, min_sp_off,
482 max_sp_off, sp_bytes))
483 break;
485 if (!deletable_insn_p (insn, fast, NULL))
486 break;
488 if (do_mark)
489 mark_insn (insn, fast);
490 else
491 bitmap_set_bit (arg_stores, INSN_UID (insn));
493 if (bitmap_empty_p (sp_bytes))
495 ret = true;
496 break;
500 BITMAP_FREE (sp_bytes);
501 if (!ret && arg_stores)
502 bitmap_clear (arg_stores);
504 return ret;
508 /* Remove all REG_EQUAL and REG_EQUIV notes referring to the registers INSN
509 writes to. */
511 static void
512 remove_reg_equal_equiv_notes_for_defs (rtx_insn *insn)
514 df_ref def;
516 FOR_EACH_INSN_DEF (def, insn)
517 remove_reg_equal_equiv_notes_for_regno (DF_REF_REGNO (def));
520 /* Scan all BBs for debug insns and reset those that reference values
521 defined in unmarked insns. */
523 static void
524 reset_unmarked_insns_debug_uses (void)
526 basic_block bb;
527 rtx_insn *insn, *next;
529 FOR_EACH_BB_REVERSE_FN (bb, cfun)
530 FOR_BB_INSNS_REVERSE_SAFE (bb, insn, next)
531 if (DEBUG_INSN_P (insn))
533 df_ref use;
535 FOR_EACH_INSN_USE (use, insn)
537 struct df_link *defs;
538 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
540 rtx_insn *ref_insn;
541 if (DF_REF_IS_ARTIFICIAL (defs->ref))
542 continue;
543 ref_insn = DF_REF_INSN (defs->ref);
544 if (!marked_insn_p (ref_insn))
545 break;
547 if (!defs)
548 continue;
549 /* ??? FIXME could we propagate the values assigned to
550 each of the DEFs? */
551 INSN_VAR_LOCATION_LOC (insn) = gen_rtx_UNKNOWN_VAR_LOC ();
552 df_insn_rescan_debug_internal (insn);
553 break;
558 /* Delete every instruction that hasn't been marked. */
560 static void
561 delete_unmarked_insns (void)
563 basic_block bb;
564 rtx_insn *insn, *next;
565 bool must_clean = false;
567 FOR_EACH_BB_REVERSE_FN (bb, cfun)
568 FOR_BB_INSNS_REVERSE_SAFE (bb, insn, next)
569 if (NONDEBUG_INSN_P (insn))
571 /* Always delete no-op moves. */
572 if (noop_move_p (insn))
575 /* Otherwise rely only on the DCE algorithm. */
576 else if (marked_insn_p (insn))
577 continue;
579 /* Beware that reaching a dbg counter limit here can result
580 in miscompiled file. This occurs when a group of insns
581 must be deleted together, typically because the kept insn
582 depends on the output from the deleted insn. Deleting
583 this insns in reverse order (both at the bb level and
584 when looking at the blocks) minimizes this, but does not
585 eliminate it, since it is possible for the using insn to
586 be top of a block and the producer to be at the bottom of
587 the block. However, in most cases this will only result
588 in an uninitialized use of an insn that is dead anyway.
590 However, there is one rare case that will cause a
591 miscompile: deletion of non-looping pure and constant
592 calls on a machine where ACCUMULATE_OUTGOING_ARGS is true.
593 In this case it is possible to remove the call, but leave
594 the argument pushes to the stack. Because of the changes
595 to the stack pointer, this will almost always lead to a
596 miscompile. */
597 if (!dbg_cnt (dce))
598 continue;
600 if (dump_file)
601 fprintf (dump_file, "DCE: Deleting insn %d\n", INSN_UID (insn));
603 /* Before we delete the insn we have to remove the REG_EQUAL notes
604 for the destination regs in order to avoid dangling notes. */
605 remove_reg_equal_equiv_notes_for_defs (insn);
607 /* If a pure or const call is deleted, this may make the cfg
608 have unreachable blocks. We rememeber this and call
609 delete_unreachable_blocks at the end. */
610 if (CALL_P (insn))
611 must_clean = true;
613 /* Now delete the insn. */
614 delete_insn_and_edges (insn);
617 /* Deleted a pure or const call. */
618 if (must_clean)
619 delete_unreachable_blocks ();
623 /* Go through the instructions and mark those whose necessity is not
624 dependent on inter-instruction information. Make sure all other
625 instructions are not marked. */
627 static void
628 prescan_insns_for_dce (bool fast)
630 basic_block bb;
631 rtx_insn *insn, *prev;
632 bitmap arg_stores = NULL;
634 if (dump_file)
635 fprintf (dump_file, "Finding needed instructions:\n");
637 if (!df_in_progress && ACCUMULATE_OUTGOING_ARGS)
638 arg_stores = BITMAP_ALLOC (NULL);
640 FOR_EACH_BB_FN (bb, cfun)
642 FOR_BB_INSNS_REVERSE_SAFE (bb, insn, prev)
643 if (NONDEBUG_INSN_P (insn))
645 /* Don't mark argument stores now. They will be marked
646 if needed when the associated CALL is marked. */
647 if (arg_stores && bitmap_bit_p (arg_stores, INSN_UID (insn)))
648 continue;
649 if (deletable_insn_p (insn, fast, arg_stores))
650 mark_nonreg_stores (PATTERN (insn), insn, fast);
651 else
652 mark_insn (insn, fast);
654 /* find_call_stack_args only looks at argument stores in the
655 same bb. */
656 if (arg_stores)
657 bitmap_clear (arg_stores);
660 if (arg_stores)
661 BITMAP_FREE (arg_stores);
663 if (dump_file)
664 fprintf (dump_file, "Finished finding needed instructions:\n");
668 /* UD-based DCE routines. */
670 /* Mark instructions that define artificially-used registers, such as
671 the frame pointer and the stack pointer. */
673 static void
674 mark_artificial_uses (void)
676 basic_block bb;
677 struct df_link *defs;
678 df_ref use;
680 FOR_ALL_BB_FN (bb, cfun)
681 FOR_EACH_ARTIFICIAL_USE (use, bb->index)
682 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
683 if (!DF_REF_IS_ARTIFICIAL (defs->ref))
684 mark_insn (DF_REF_INSN (defs->ref), false);
688 /* Mark every instruction that defines a register value that INSN uses. */
690 static void
691 mark_reg_dependencies (rtx_insn *insn)
693 struct df_link *defs;
694 df_ref use;
696 if (DEBUG_INSN_P (insn))
697 return;
699 FOR_EACH_INSN_USE (use, insn)
701 if (dump_file)
703 fprintf (dump_file, "Processing use of ");
704 print_simple_rtl (dump_file, DF_REF_REG (use));
705 fprintf (dump_file, " in insn %d:\n", INSN_UID (insn));
707 for (defs = DF_REF_CHAIN (use); defs; defs = defs->next)
708 if (! DF_REF_IS_ARTIFICIAL (defs->ref))
709 mark_insn (DF_REF_INSN (defs->ref), false);
714 /* Initialize global variables for a new DCE pass. */
716 static void
717 init_dce (bool fast)
719 if (!df_in_progress)
721 if (!fast)
723 df_set_flags (DF_RD_PRUNE_DEAD_DEFS);
724 df_chain_add_problem (DF_UD_CHAIN);
726 df_analyze ();
729 if (dump_file)
730 df_dump (dump_file);
732 if (fast)
734 bitmap_obstack_initialize (&dce_blocks_bitmap_obstack);
735 bitmap_obstack_initialize (&dce_tmp_bitmap_obstack);
736 can_alter_cfg = false;
738 else
739 can_alter_cfg = true;
741 marked = sbitmap_alloc (get_max_uid () + 1);
742 bitmap_clear (marked);
746 /* Free the data allocated by init_dce. */
748 static void
749 fini_dce (bool fast)
751 sbitmap_free (marked);
753 if (fast)
755 bitmap_obstack_release (&dce_blocks_bitmap_obstack);
756 bitmap_obstack_release (&dce_tmp_bitmap_obstack);
761 /* UD-chain based DCE. */
763 static unsigned int
764 rest_of_handle_ud_dce (void)
766 rtx_insn *insn;
768 init_dce (false);
770 prescan_insns_for_dce (false);
771 mark_artificial_uses ();
772 while (worklist.length () > 0)
774 insn = worklist.pop ();
775 mark_reg_dependencies (insn);
777 worklist.release ();
779 if (MAY_HAVE_DEBUG_INSNS)
780 reset_unmarked_insns_debug_uses ();
782 /* Before any insns are deleted, we must remove the chains since
783 they are not bidirectional. */
784 df_remove_problem (df_chain);
785 delete_unmarked_insns ();
787 fini_dce (false);
788 return 0;
792 namespace {
794 const pass_data pass_data_ud_rtl_dce =
796 RTL_PASS, /* type */
797 "ud_dce", /* name */
798 OPTGROUP_NONE, /* optinfo_flags */
799 TV_DCE, /* tv_id */
800 0, /* properties_required */
801 0, /* properties_provided */
802 0, /* properties_destroyed */
803 0, /* todo_flags_start */
804 TODO_df_finish, /* todo_flags_finish */
807 class pass_ud_rtl_dce : public rtl_opt_pass
809 public:
810 pass_ud_rtl_dce (gcc::context *ctxt)
811 : rtl_opt_pass (pass_data_ud_rtl_dce, ctxt)
814 /* opt_pass methods: */
815 virtual bool gate (function *)
817 return optimize > 1 && flag_dce && dbg_cnt (dce_ud);
820 virtual unsigned int execute (function *)
822 return rest_of_handle_ud_dce ();
825 }; // class pass_ud_rtl_dce
827 } // anon namespace
829 rtl_opt_pass *
830 make_pass_ud_rtl_dce (gcc::context *ctxt)
832 return new pass_ud_rtl_dce (ctxt);
836 /* -------------------------------------------------------------------------
837 Fast DCE functions
838 ------------------------------------------------------------------------- */
840 /* Process basic block BB. Return true if the live_in set has
841 changed. REDO_OUT is true if the info at the bottom of the block
842 needs to be recalculated before starting. AU is the proper set of
843 artificial uses. Track global substitution of uses of dead pseudos
844 in debug insns using GLOBAL_DEBUG. */
846 static bool
847 word_dce_process_block (basic_block bb, bool redo_out,
848 struct dead_debug_global *global_debug)
850 bitmap local_live = BITMAP_ALLOC (&dce_tmp_bitmap_obstack);
851 rtx_insn *insn;
852 bool block_changed;
853 struct dead_debug_local debug;
855 if (redo_out)
857 /* Need to redo the live_out set of this block if when one of
858 the succs of this block has had a change in it live in
859 set. */
860 edge e;
861 edge_iterator ei;
862 df_confluence_function_n con_fun_n = df_word_lr->problem->con_fun_n;
863 bitmap_clear (DF_WORD_LR_OUT (bb));
864 FOR_EACH_EDGE (e, ei, bb->succs)
865 (*con_fun_n) (e);
868 if (dump_file)
870 fprintf (dump_file, "processing block %d live out = ", bb->index);
871 df_print_word_regset (dump_file, DF_WORD_LR_OUT (bb));
874 bitmap_copy (local_live, DF_WORD_LR_OUT (bb));
875 dead_debug_local_init (&debug, NULL, global_debug);
877 FOR_BB_INSNS_REVERSE (bb, insn)
878 if (DEBUG_INSN_P (insn))
880 df_ref use;
881 FOR_EACH_INSN_USE (use, insn)
882 if (DF_REF_REGNO (use) >= FIRST_PSEUDO_REGISTER
883 && (GET_MODE_SIZE (GET_MODE (DF_REF_REAL_REG (use)))
884 == 2 * UNITS_PER_WORD)
885 && !bitmap_bit_p (local_live, 2 * DF_REF_REGNO (use))
886 && !bitmap_bit_p (local_live, 2 * DF_REF_REGNO (use) + 1))
887 dead_debug_add (&debug, use, DF_REF_REGNO (use));
889 else if (INSN_P (insn))
891 bool any_changed;
893 /* No matter if the instruction is needed or not, we remove
894 any regno in the defs from the live set. */
895 any_changed = df_word_lr_simulate_defs (insn, local_live);
896 if (any_changed)
897 mark_insn (insn, true);
899 /* On the other hand, we do not allow the dead uses to set
900 anything in local_live. */
901 if (marked_insn_p (insn))
902 df_word_lr_simulate_uses (insn, local_live);
904 /* Insert debug temps for dead REGs used in subsequent debug
905 insns. We may have to emit a debug temp even if the insn
906 was marked, in case the debug use was after the point of
907 death. */
908 if (debug.used && !bitmap_empty_p (debug.used))
910 df_ref def;
912 FOR_EACH_INSN_DEF (def, insn)
913 dead_debug_insert_temp (&debug, DF_REF_REGNO (def), insn,
914 marked_insn_p (insn)
915 && !control_flow_insn_p (insn)
916 ? DEBUG_TEMP_AFTER_WITH_REG_FORCE
917 : DEBUG_TEMP_BEFORE_WITH_VALUE);
920 if (dump_file)
922 fprintf (dump_file, "finished processing insn %d live out = ",
923 INSN_UID (insn));
924 df_print_word_regset (dump_file, local_live);
928 block_changed = !bitmap_equal_p (local_live, DF_WORD_LR_IN (bb));
929 if (block_changed)
930 bitmap_copy (DF_WORD_LR_IN (bb), local_live);
932 dead_debug_local_finish (&debug, NULL);
933 BITMAP_FREE (local_live);
934 return block_changed;
938 /* Process basic block BB. Return true if the live_in set has
939 changed. REDO_OUT is true if the info at the bottom of the block
940 needs to be recalculated before starting. AU is the proper set of
941 artificial uses. Track global substitution of uses of dead pseudos
942 in debug insns using GLOBAL_DEBUG. */
944 static bool
945 dce_process_block (basic_block bb, bool redo_out, bitmap au,
946 struct dead_debug_global *global_debug)
948 bitmap local_live = BITMAP_ALLOC (&dce_tmp_bitmap_obstack);
949 rtx_insn *insn;
950 bool block_changed;
951 df_ref def;
952 struct dead_debug_local debug;
954 if (redo_out)
956 /* Need to redo the live_out set of this block if when one of
957 the succs of this block has had a change in it live in
958 set. */
959 edge e;
960 edge_iterator ei;
961 df_confluence_function_n con_fun_n = df_lr->problem->con_fun_n;
962 bitmap_clear (DF_LR_OUT (bb));
963 FOR_EACH_EDGE (e, ei, bb->succs)
964 (*con_fun_n) (e);
967 if (dump_file)
969 fprintf (dump_file, "processing block %d lr out = ", bb->index);
970 df_print_regset (dump_file, DF_LR_OUT (bb));
973 bitmap_copy (local_live, DF_LR_OUT (bb));
975 df_simulate_initialize_backwards (bb, local_live);
976 dead_debug_local_init (&debug, NULL, global_debug);
978 FOR_BB_INSNS_REVERSE (bb, insn)
979 if (DEBUG_INSN_P (insn))
981 df_ref use;
982 FOR_EACH_INSN_USE (use, insn)
983 if (!bitmap_bit_p (local_live, DF_REF_REGNO (use))
984 && !bitmap_bit_p (au, DF_REF_REGNO (use)))
985 dead_debug_add (&debug, use, DF_REF_REGNO (use));
987 else if (INSN_P (insn))
989 bool needed = marked_insn_p (insn);
991 /* The insn is needed if there is someone who uses the output. */
992 if (!needed)
993 FOR_EACH_INSN_DEF (def, insn)
994 if (bitmap_bit_p (local_live, DF_REF_REGNO (def))
995 || bitmap_bit_p (au, DF_REF_REGNO (def)))
997 needed = true;
998 mark_insn (insn, true);
999 break;
1002 /* No matter if the instruction is needed or not, we remove
1003 any regno in the defs from the live set. */
1004 df_simulate_defs (insn, local_live);
1006 /* On the other hand, we do not allow the dead uses to set
1007 anything in local_live. */
1008 if (needed)
1009 df_simulate_uses (insn, local_live);
1011 /* Insert debug temps for dead REGs used in subsequent debug
1012 insns. We may have to emit a debug temp even if the insn
1013 was marked, in case the debug use was after the point of
1014 death. */
1015 if (debug.used && !bitmap_empty_p (debug.used))
1016 FOR_EACH_INSN_DEF (def, insn)
1017 dead_debug_insert_temp (&debug, DF_REF_REGNO (def), insn,
1018 needed && !control_flow_insn_p (insn)
1019 ? DEBUG_TEMP_AFTER_WITH_REG_FORCE
1020 : DEBUG_TEMP_BEFORE_WITH_VALUE);
1023 dead_debug_local_finish (&debug, NULL);
1024 df_simulate_finalize_backwards (bb, local_live);
1026 block_changed = !bitmap_equal_p (local_live, DF_LR_IN (bb));
1027 if (block_changed)
1028 bitmap_copy (DF_LR_IN (bb), local_live);
1030 BITMAP_FREE (local_live);
1031 return block_changed;
1035 /* Perform fast DCE once initialization is done. If WORD_LEVEL is
1036 true, use the word level dce, otherwise do it at the pseudo
1037 level. */
1039 static void
1040 fast_dce (bool word_level)
1042 int *postorder = df_get_postorder (DF_BACKWARD);
1043 int n_blocks = df_get_n_blocks (DF_BACKWARD);
1044 /* The set of blocks that have been seen on this iteration. */
1045 bitmap processed = BITMAP_ALLOC (&dce_blocks_bitmap_obstack);
1046 /* The set of blocks that need to have the out vectors reset because
1047 the in of one of their successors has changed. */
1048 bitmap redo_out = BITMAP_ALLOC (&dce_blocks_bitmap_obstack);
1049 bitmap all_blocks = BITMAP_ALLOC (&dce_blocks_bitmap_obstack);
1050 bool global_changed = true;
1052 /* These regs are considered always live so if they end up dying
1053 because of some def, we need to bring the back again. Calling
1054 df_simulate_fixup_sets has the disadvantage of calling
1055 bb_has_eh_pred once per insn, so we cache the information
1056 here. */
1057 bitmap au = &df->regular_block_artificial_uses;
1058 bitmap au_eh = &df->eh_block_artificial_uses;
1059 int i;
1060 struct dead_debug_global global_debug;
1062 prescan_insns_for_dce (true);
1064 for (i = 0; i < n_blocks; i++)
1065 bitmap_set_bit (all_blocks, postorder[i]);
1067 dead_debug_global_init (&global_debug, NULL);
1069 while (global_changed)
1071 global_changed = false;
1073 for (i = 0; i < n_blocks; i++)
1075 int index = postorder[i];
1076 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, index);
1077 bool local_changed;
1079 if (index < NUM_FIXED_BLOCKS)
1081 bitmap_set_bit (processed, index);
1082 continue;
1085 if (word_level)
1086 local_changed
1087 = word_dce_process_block (bb, bitmap_bit_p (redo_out, index),
1088 &global_debug);
1089 else
1090 local_changed
1091 = dce_process_block (bb, bitmap_bit_p (redo_out, index),
1092 bb_has_eh_pred (bb) ? au_eh : au,
1093 &global_debug);
1094 bitmap_set_bit (processed, index);
1096 if (local_changed)
1098 edge e;
1099 edge_iterator ei;
1100 FOR_EACH_EDGE (e, ei, bb->preds)
1101 if (bitmap_bit_p (processed, e->src->index))
1102 /* Be tricky about when we need to iterate the
1103 analysis. We only have redo the analysis if the
1104 bitmaps change at the top of a block that is the
1105 entry to a loop. */
1106 global_changed = true;
1107 else
1108 bitmap_set_bit (redo_out, e->src->index);
1112 if (global_changed)
1114 /* Turn off the RUN_DCE flag to prevent recursive calls to
1115 dce. */
1116 int old_flag = df_clear_flags (DF_LR_RUN_DCE);
1118 /* So something was deleted that requires a redo. Do it on
1119 the cheap. */
1120 delete_unmarked_insns ();
1121 bitmap_clear (marked);
1122 bitmap_clear (processed);
1123 bitmap_clear (redo_out);
1125 /* We do not need to rescan any instructions. We only need
1126 to redo the dataflow equations for the blocks that had a
1127 change at the top of the block. Then we need to redo the
1128 iteration. */
1129 if (word_level)
1130 df_analyze_problem (df_word_lr, all_blocks, postorder, n_blocks);
1131 else
1132 df_analyze_problem (df_lr, all_blocks, postorder, n_blocks);
1134 if (old_flag & DF_LR_RUN_DCE)
1135 df_set_flags (DF_LR_RUN_DCE);
1137 prescan_insns_for_dce (true);
1141 dead_debug_global_finish (&global_debug, NULL);
1143 delete_unmarked_insns ();
1145 BITMAP_FREE (processed);
1146 BITMAP_FREE (redo_out);
1147 BITMAP_FREE (all_blocks);
1151 /* Fast register level DCE. */
1153 static unsigned int
1154 rest_of_handle_fast_dce (void)
1156 init_dce (true);
1157 fast_dce (false);
1158 fini_dce (true);
1159 return 0;
1163 /* Fast byte level DCE. */
1165 void
1166 run_word_dce (void)
1168 int old_flags;
1170 if (!flag_dce)
1171 return;
1173 timevar_push (TV_DCE);
1174 old_flags = df_clear_flags (DF_DEFER_INSN_RESCAN + DF_NO_INSN_RESCAN);
1175 df_word_lr_add_problem ();
1176 init_dce (true);
1177 fast_dce (true);
1178 fini_dce (true);
1179 df_set_flags (old_flags);
1180 timevar_pop (TV_DCE);
1184 /* This is an internal call that is used by the df live register
1185 problem to run fast dce as a side effect of creating the live
1186 information. The stack is organized so that the lr problem is run,
1187 this pass is run, which updates the live info and the df scanning
1188 info, and then returns to allow the rest of the problems to be run.
1190 This can be called by elsewhere but it will not update the bit
1191 vectors for any other problems than LR. */
1193 void
1194 run_fast_df_dce (void)
1196 if (flag_dce)
1198 /* If dce is able to delete something, it has to happen
1199 immediately. Otherwise there will be problems handling the
1200 eq_notes. */
1201 int old_flags =
1202 df_clear_flags (DF_DEFER_INSN_RESCAN + DF_NO_INSN_RESCAN);
1204 df_in_progress = true;
1205 rest_of_handle_fast_dce ();
1206 df_in_progress = false;
1208 df_set_flags (old_flags);
1213 /* Run a fast DCE pass. */
1215 void
1216 run_fast_dce (void)
1218 if (flag_dce)
1219 rest_of_handle_fast_dce ();
1223 namespace {
1225 const pass_data pass_data_fast_rtl_dce =
1227 RTL_PASS, /* type */
1228 "rtl_dce", /* name */
1229 OPTGROUP_NONE, /* optinfo_flags */
1230 TV_DCE, /* tv_id */
1231 0, /* properties_required */
1232 0, /* properties_provided */
1233 0, /* properties_destroyed */
1234 0, /* todo_flags_start */
1235 TODO_df_finish, /* todo_flags_finish */
1238 class pass_fast_rtl_dce : public rtl_opt_pass
1240 public:
1241 pass_fast_rtl_dce (gcc::context *ctxt)
1242 : rtl_opt_pass (pass_data_fast_rtl_dce, ctxt)
1245 /* opt_pass methods: */
1246 virtual bool gate (function *)
1248 return optimize > 0 && flag_dce && dbg_cnt (dce_fast);
1251 virtual unsigned int execute (function *)
1253 return rest_of_handle_fast_dce ();
1256 }; // class pass_fast_rtl_dce
1258 } // anon namespace
1260 rtl_opt_pass *
1261 make_pass_fast_rtl_dce (gcc::context *ctxt)
1263 return new pass_fast_rtl_dce (ctxt);