re PR middle-end/91603 (Unaligned access in expand_assignment)
[official-gcc.git] / gcc / sanopt.c
blob00ade87283223798038e58c37e9138fe483de5a1
1 /* Optimize and expand sanitizer functions.
2 Copyright (C) 2014-2019 Free Software Foundation, Inc.
3 Contributed by Marek Polacek <polacek@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "backend.h"
25 #include "tree.h"
26 #include "gimple.h"
27 #include "ssa.h"
28 #include "tree-pass.h"
29 #include "tree-ssa-operands.h"
30 #include "gimple-pretty-print.h"
31 #include "fold-const.h"
32 #include "gimple-iterator.h"
33 #include "stringpool.h"
34 #include "attribs.h"
35 #include "asan.h"
36 #include "ubsan.h"
37 #include "params.h"
38 #include "tree-hash-traits.h"
39 #include "gimple-ssa.h"
40 #include "tree-phinodes.h"
41 #include "ssa-iterators.h"
42 #include "gimplify.h"
43 #include "gimple-iterator.h"
44 #include "gimple-walk.h"
45 #include "cfghooks.h"
46 #include "tree-dfa.h"
47 #include "tree-ssa.h"
48 #include "varasm.h"
50 /* This is used to carry information about basic blocks. It is
51 attached to the AUX field of the standard CFG block. */
53 struct sanopt_info
55 /* True if this BB might call (directly or indirectly) free/munmap
56 or similar operation. */
57 bool has_freeing_call_p;
59 /* True if HAS_FREEING_CALL_P flag has been computed. */
60 bool has_freeing_call_computed_p;
62 /* True if there is a block with HAS_FREEING_CALL_P flag set
63 on any path between an immediate dominator of BB, denoted
64 imm(BB), and BB. */
65 bool imm_dom_path_with_freeing_call_p;
67 /* True if IMM_DOM_PATH_WITH_FREEING_CALL_P has been computed. */
68 bool imm_dom_path_with_freeing_call_computed_p;
70 /* Number of possibly freeing calls encountered in this bb
71 (so far). */
72 uint64_t freeing_call_events;
74 /* True if BB is currently being visited during computation
75 of IMM_DOM_PATH_WITH_FREEING_CALL_P flag. */
76 bool being_visited_p;
78 /* True if this BB has been visited in the dominator walk. */
79 bool visited_p;
82 /* If T has a single definition of form T = T2, return T2. */
84 static tree
85 maybe_get_single_definition (tree t)
87 if (TREE_CODE (t) == SSA_NAME)
89 gimple *g = SSA_NAME_DEF_STMT (t);
90 if (gimple_assign_single_p (g))
91 return gimple_assign_rhs1 (g);
93 return NULL_TREE;
96 /* Tree triplet for vptr_check_map. */
97 struct sanopt_tree_triplet
99 tree t1, t2, t3;
102 /* Traits class for tree triplet hash maps below. */
104 struct sanopt_tree_triplet_hash : typed_noop_remove <sanopt_tree_triplet>
106 typedef sanopt_tree_triplet value_type;
107 typedef sanopt_tree_triplet compare_type;
109 static hashval_t
110 hash (const sanopt_tree_triplet &ref)
112 inchash::hash hstate (0);
113 inchash::add_expr (ref.t1, hstate);
114 inchash::add_expr (ref.t2, hstate);
115 inchash::add_expr (ref.t3, hstate);
116 return hstate.end ();
119 static bool
120 equal (const sanopt_tree_triplet &ref1, const sanopt_tree_triplet &ref2)
122 return operand_equal_p (ref1.t1, ref2.t1, 0)
123 && operand_equal_p (ref1.t2, ref2.t2, 0)
124 && operand_equal_p (ref1.t3, ref2.t3, 0);
127 static void
128 mark_deleted (sanopt_tree_triplet &ref)
130 ref.t1 = reinterpret_cast<tree> (1);
133 static void
134 mark_empty (sanopt_tree_triplet &ref)
136 ref.t1 = NULL;
139 static bool
140 is_deleted (const sanopt_tree_triplet &ref)
142 return ref.t1 == reinterpret_cast<tree> (1);
145 static bool
146 is_empty (const sanopt_tree_triplet &ref)
148 return ref.t1 == NULL;
152 /* Tree couple for ptr_check_map. */
153 struct sanopt_tree_couple
155 tree ptr;
156 bool pos_p;
159 /* Traits class for tree triplet hash maps below. */
161 struct sanopt_tree_couple_hash : typed_noop_remove <sanopt_tree_couple>
163 typedef sanopt_tree_couple value_type;
164 typedef sanopt_tree_couple compare_type;
166 static hashval_t
167 hash (const sanopt_tree_couple &ref)
169 inchash::hash hstate (0);
170 inchash::add_expr (ref.ptr, hstate);
171 hstate.add_int (ref.pos_p);
172 return hstate.end ();
175 static bool
176 equal (const sanopt_tree_couple &ref1, const sanopt_tree_couple &ref2)
178 return operand_equal_p (ref1.ptr, ref2.ptr, 0)
179 && ref1.pos_p == ref2.pos_p;
182 static void
183 mark_deleted (sanopt_tree_couple &ref)
185 ref.ptr = reinterpret_cast<tree> (1);
188 static void
189 mark_empty (sanopt_tree_couple &ref)
191 ref.ptr = NULL;
194 static bool
195 is_deleted (const sanopt_tree_couple &ref)
197 return ref.ptr == reinterpret_cast<tree> (1);
200 static bool
201 is_empty (const sanopt_tree_couple &ref)
203 return ref.ptr == NULL;
207 /* This is used to carry various hash maps and variables used
208 in sanopt_optimize_walker. */
210 class sanopt_ctx
212 public:
213 /* This map maps a pointer (the first argument of UBSAN_NULL) to
214 a vector of UBSAN_NULL call statements that check this pointer. */
215 hash_map<tree, auto_vec<gimple *> > null_check_map;
217 /* This map maps a pointer (the second argument of ASAN_CHECK) to
218 a vector of ASAN_CHECK call statements that check the access. */
219 hash_map<tree_operand_hash, auto_vec<gimple *> > asan_check_map;
221 /* This map maps a tree triplet (the first, second and fourth argument
222 of UBSAN_VPTR) to a vector of UBSAN_VPTR call statements that check
223 that virtual table pointer. */
224 hash_map<sanopt_tree_triplet_hash, auto_vec<gimple *> > vptr_check_map;
226 /* This map maps a couple (tree and boolean) to a vector of UBSAN_PTR
227 call statements that check that pointer overflow. */
228 hash_map<sanopt_tree_couple_hash, auto_vec<gimple *> > ptr_check_map;
230 /* Number of IFN_ASAN_CHECK statements. */
231 int asan_num_accesses;
233 /* True when the current functions constains an ASAN_MARK. */
234 bool contains_asan_mark;
237 /* Return true if there might be any call to free/munmap operation
238 on any path in between DOM (which should be imm(BB)) and BB. */
240 static bool
241 imm_dom_path_with_freeing_call (basic_block bb, basic_block dom)
243 sanopt_info *info = (sanopt_info *) bb->aux;
244 edge e;
245 edge_iterator ei;
247 if (info->imm_dom_path_with_freeing_call_computed_p)
248 return info->imm_dom_path_with_freeing_call_p;
250 info->being_visited_p = true;
252 FOR_EACH_EDGE (e, ei, bb->preds)
254 sanopt_info *pred_info = (sanopt_info *) e->src->aux;
256 if (e->src == dom)
257 continue;
259 if ((pred_info->imm_dom_path_with_freeing_call_computed_p
260 && pred_info->imm_dom_path_with_freeing_call_p)
261 || (pred_info->has_freeing_call_computed_p
262 && pred_info->has_freeing_call_p))
264 info->imm_dom_path_with_freeing_call_computed_p = true;
265 info->imm_dom_path_with_freeing_call_p = true;
266 info->being_visited_p = false;
267 return true;
271 FOR_EACH_EDGE (e, ei, bb->preds)
273 sanopt_info *pred_info = (sanopt_info *) e->src->aux;
275 if (e->src == dom)
276 continue;
278 if (pred_info->has_freeing_call_computed_p)
279 continue;
281 gimple_stmt_iterator gsi;
282 for (gsi = gsi_start_bb (e->src); !gsi_end_p (gsi); gsi_next (&gsi))
284 gimple *stmt = gsi_stmt (gsi);
285 gasm *asm_stmt;
287 if ((is_gimple_call (stmt) && !nonfreeing_call_p (stmt))
288 || ((asm_stmt = dyn_cast <gasm *> (stmt))
289 && (gimple_asm_clobbers_memory_p (asm_stmt)
290 || gimple_asm_volatile_p (asm_stmt))))
292 pred_info->has_freeing_call_p = true;
293 break;
297 pred_info->has_freeing_call_computed_p = true;
298 if (pred_info->has_freeing_call_p)
300 info->imm_dom_path_with_freeing_call_computed_p = true;
301 info->imm_dom_path_with_freeing_call_p = true;
302 info->being_visited_p = false;
303 return true;
307 FOR_EACH_EDGE (e, ei, bb->preds)
309 if (e->src == dom)
310 continue;
312 basic_block src;
313 for (src = e->src; src != dom; )
315 sanopt_info *pred_info = (sanopt_info *) src->aux;
316 if (pred_info->being_visited_p)
317 break;
318 basic_block imm = get_immediate_dominator (CDI_DOMINATORS, src);
319 if (imm_dom_path_with_freeing_call (src, imm))
321 info->imm_dom_path_with_freeing_call_computed_p = true;
322 info->imm_dom_path_with_freeing_call_p = true;
323 info->being_visited_p = false;
324 return true;
326 src = imm;
330 info->imm_dom_path_with_freeing_call_computed_p = true;
331 info->imm_dom_path_with_freeing_call_p = false;
332 info->being_visited_p = false;
333 return false;
336 /* Get the first dominating check from the list of stored checks.
337 Non-dominating checks are silently dropped. */
339 static gimple *
340 maybe_get_dominating_check (auto_vec<gimple *> &v)
342 for (; !v.is_empty (); v.pop ())
344 gimple *g = v.last ();
345 sanopt_info *si = (sanopt_info *) gimple_bb (g)->aux;
346 if (!si->visited_p)
347 /* At this point we shouldn't have any statements
348 that aren't dominating the current BB. */
349 return g;
351 return NULL;
354 /* Optimize away redundant UBSAN_NULL calls. */
356 static bool
357 maybe_optimize_ubsan_null_ifn (class sanopt_ctx *ctx, gimple *stmt)
359 gcc_assert (gimple_call_num_args (stmt) == 3);
360 tree ptr = gimple_call_arg (stmt, 0);
361 tree cur_align = gimple_call_arg (stmt, 2);
362 gcc_assert (TREE_CODE (cur_align) == INTEGER_CST);
363 bool remove = false;
365 auto_vec<gimple *> &v = ctx->null_check_map.get_or_insert (ptr);
366 gimple *g = maybe_get_dominating_check (v);
367 if (!g)
369 /* For this PTR we don't have any UBSAN_NULL stmts recorded, so there's
370 nothing to optimize yet. */
371 v.safe_push (stmt);
372 return false;
375 /* We already have recorded a UBSAN_NULL check for this pointer. Perhaps we
376 can drop this one. But only if this check doesn't specify stricter
377 alignment. */
379 tree align = gimple_call_arg (g, 2);
380 int kind = tree_to_shwi (gimple_call_arg (g, 1));
381 /* If this is a NULL pointer check where we had segv anyway, we can
382 remove it. */
383 if (integer_zerop (align)
384 && (kind == UBSAN_LOAD_OF
385 || kind == UBSAN_STORE_OF
386 || kind == UBSAN_MEMBER_ACCESS))
387 remove = true;
388 /* Otherwise remove the check in non-recovering mode, or if the
389 stmts have same location. */
390 else if (integer_zerop (align))
391 remove = (flag_sanitize_recover & SANITIZE_NULL) == 0
392 || flag_sanitize_undefined_trap_on_error
393 || gimple_location (g) == gimple_location (stmt);
394 else if (tree_int_cst_le (cur_align, align))
395 remove = (flag_sanitize_recover & SANITIZE_ALIGNMENT) == 0
396 || flag_sanitize_undefined_trap_on_error
397 || gimple_location (g) == gimple_location (stmt);
399 if (!remove && gimple_bb (g) == gimple_bb (stmt)
400 && tree_int_cst_compare (cur_align, align) == 0)
401 v.pop ();
403 if (!remove)
404 v.safe_push (stmt);
405 return remove;
408 /* Return true when pointer PTR for a given CUR_OFFSET is already sanitized
409 in a given sanitization context CTX. */
411 static bool
412 has_dominating_ubsan_ptr_check (sanopt_ctx *ctx, tree ptr,
413 offset_int &cur_offset)
415 bool pos_p = !wi::neg_p (cur_offset);
416 sanopt_tree_couple couple;
417 couple.ptr = ptr;
418 couple.pos_p = pos_p;
420 auto_vec<gimple *> &v = ctx->ptr_check_map.get_or_insert (couple);
421 gimple *g = maybe_get_dominating_check (v);
422 if (!g)
423 return false;
425 /* We already have recorded a UBSAN_PTR check for this pointer. Perhaps we
426 can drop this one. But only if this check doesn't specify larger offset.
428 tree offset = gimple_call_arg (g, 1);
429 gcc_assert (TREE_CODE (offset) == INTEGER_CST);
430 offset_int ooffset = wi::sext (wi::to_offset (offset), POINTER_SIZE);
432 if (pos_p)
434 if (wi::les_p (cur_offset, ooffset))
435 return true;
437 else if (!pos_p && wi::les_p (ooffset, cur_offset))
438 return true;
440 return false;
443 /* Record UBSAN_PTR check of given context CTX. Register pointer PTR on
444 a given OFFSET that it's handled by GIMPLE STMT. */
446 static void
447 record_ubsan_ptr_check_stmt (sanopt_ctx *ctx, gimple *stmt, tree ptr,
448 const offset_int &offset)
450 sanopt_tree_couple couple;
451 couple.ptr = ptr;
452 couple.pos_p = !wi::neg_p (offset);
454 auto_vec<gimple *> &v = ctx->ptr_check_map.get_or_insert (couple);
455 v.safe_push (stmt);
458 /* Optimize away redundant UBSAN_PTR calls. */
460 static bool
461 maybe_optimize_ubsan_ptr_ifn (sanopt_ctx *ctx, gimple *stmt)
463 poly_int64 bitsize, pbitpos;
464 machine_mode mode;
465 int volatilep = 0, reversep, unsignedp = 0;
466 tree offset;
468 gcc_assert (gimple_call_num_args (stmt) == 2);
469 tree ptr = gimple_call_arg (stmt, 0);
470 tree off = gimple_call_arg (stmt, 1);
472 if (TREE_CODE (off) != INTEGER_CST)
473 return false;
475 if (integer_zerop (off))
476 return true;
478 offset_int cur_offset = wi::sext (wi::to_offset (off), POINTER_SIZE);
479 if (has_dominating_ubsan_ptr_check (ctx, ptr, cur_offset))
480 return true;
482 tree base = ptr;
483 if (TREE_CODE (base) == ADDR_EXPR)
485 base = TREE_OPERAND (base, 0);
487 HOST_WIDE_INT bitpos;
488 base = get_inner_reference (base, &bitsize, &pbitpos, &offset, &mode,
489 &unsignedp, &reversep, &volatilep);
490 if ((offset == NULL_TREE || TREE_CODE (offset) == INTEGER_CST)
491 && DECL_P (base)
492 && !DECL_REGISTER (base)
493 && pbitpos.is_constant (&bitpos))
495 offset_int expr_offset;
496 if (offset)
497 expr_offset = wi::to_offset (offset) + bitpos / BITS_PER_UNIT;
498 else
499 expr_offset = bitpos / BITS_PER_UNIT;
500 expr_offset = wi::sext (expr_offset, POINTER_SIZE);
501 offset_int total_offset = expr_offset + cur_offset;
502 if (total_offset != wi::sext (total_offset, POINTER_SIZE))
504 record_ubsan_ptr_check_stmt (ctx, stmt, ptr, cur_offset);
505 return false;
508 /* If BASE is a fixed size automatic variable or
509 global variable defined in the current TU, we don't have
510 to instrument anything if offset is within address
511 of the variable. */
512 if ((VAR_P (base)
513 || TREE_CODE (base) == PARM_DECL
514 || TREE_CODE (base) == RESULT_DECL)
515 && DECL_SIZE_UNIT (base)
516 && TREE_CODE (DECL_SIZE_UNIT (base)) == INTEGER_CST
517 && (!is_global_var (base) || decl_binds_to_current_def_p (base)))
519 offset_int base_size = wi::to_offset (DECL_SIZE_UNIT (base));
520 if (!wi::neg_p (expr_offset)
521 && wi::les_p (total_offset, base_size))
523 if (!wi::neg_p (total_offset)
524 && wi::les_p (total_offset, base_size))
525 return true;
529 /* Following expression: UBSAN_PTR (&MEM_REF[ptr + x], y) can be
530 handled as follows:
532 1) sign (x) == sign (y), then check for dominating check of (x + y)
533 2) sign (x) != sign (y), then first check if we have a dominating
534 check for ptr + x. If so, then we have 2 situations:
535 a) sign (x) == sign (x + y), here we are done, example:
536 UBSAN_PTR (&MEM_REF[ptr + 100], -50)
537 b) check for dominating check of ptr + x + y.
540 bool sign_cur_offset = !wi::neg_p (cur_offset);
541 bool sign_expr_offset = !wi::neg_p (expr_offset);
543 tree base_addr
544 = build1 (ADDR_EXPR, build_pointer_type (TREE_TYPE (base)), base);
546 bool add = false;
547 if (sign_cur_offset == sign_expr_offset)
549 if (has_dominating_ubsan_ptr_check (ctx, base_addr, total_offset))
550 return true;
551 else
552 add = true;
554 else
556 if (!has_dominating_ubsan_ptr_check (ctx, base_addr, expr_offset))
557 ; /* Don't record base_addr + expr_offset, it's not a guarding
558 check. */
559 else
561 bool sign_total_offset = !wi::neg_p (total_offset);
562 if (sign_expr_offset == sign_total_offset)
563 return true;
564 else
566 if (has_dominating_ubsan_ptr_check (ctx, base_addr,
567 total_offset))
568 return true;
569 else
570 add = true;
575 /* Record a new dominating check for base_addr + total_offset. */
576 if (add && !operand_equal_p (base, base_addr, 0))
577 record_ubsan_ptr_check_stmt (ctx, stmt, base_addr,
578 total_offset);
582 /* For this PTR we don't have any UBSAN_PTR stmts recorded, so there's
583 nothing to optimize yet. */
584 record_ubsan_ptr_check_stmt (ctx, stmt, ptr, cur_offset);
586 return false;
589 /* Optimize away redundant UBSAN_VPTR calls. The second argument
590 is the value loaded from the virtual table, so rely on FRE to find out
591 when we can actually optimize. */
593 static bool
594 maybe_optimize_ubsan_vptr_ifn (class sanopt_ctx *ctx, gimple *stmt)
596 gcc_assert (gimple_call_num_args (stmt) == 5);
597 sanopt_tree_triplet triplet;
598 triplet.t1 = gimple_call_arg (stmt, 0);
599 triplet.t2 = gimple_call_arg (stmt, 1);
600 triplet.t3 = gimple_call_arg (stmt, 3);
602 auto_vec<gimple *> &v = ctx->vptr_check_map.get_or_insert (triplet);
603 gimple *g = maybe_get_dominating_check (v);
604 if (!g)
606 /* For this PTR we don't have any UBSAN_VPTR stmts recorded, so there's
607 nothing to optimize yet. */
608 v.safe_push (stmt);
609 return false;
612 return true;
615 /* Returns TRUE if ASan check of length LEN in block BB can be removed
616 if preceded by checks in V. */
618 static bool
619 can_remove_asan_check (auto_vec<gimple *> &v, tree len, basic_block bb)
621 unsigned int i;
622 gimple *g;
623 gimple *to_pop = NULL;
624 bool remove = false;
625 basic_block last_bb = bb;
626 bool cleanup = false;
628 FOR_EACH_VEC_ELT_REVERSE (v, i, g)
630 basic_block gbb = gimple_bb (g);
631 sanopt_info *si = (sanopt_info *) gbb->aux;
632 if (gimple_uid (g) < si->freeing_call_events)
634 /* If there is a potentially freeing call after g in gbb, we should
635 remove it from the vector, can't use in optimization. */
636 cleanup = true;
637 continue;
640 tree glen = gimple_call_arg (g, 2);
641 gcc_assert (TREE_CODE (glen) == INTEGER_CST);
643 /* If we've checked only smaller length than we want to check now,
644 we can't remove the current stmt. If g is in the same basic block,
645 we want to remove it though, as the current stmt is better. */
646 if (tree_int_cst_lt (glen, len))
648 if (gbb == bb)
650 to_pop = g;
651 cleanup = true;
653 continue;
656 while (last_bb != gbb)
658 /* Paths from last_bb to bb have been checked before.
659 gbb is necessarily a dominator of last_bb, but not necessarily
660 immediate dominator. */
661 if (((sanopt_info *) last_bb->aux)->freeing_call_events)
662 break;
664 basic_block imm = get_immediate_dominator (CDI_DOMINATORS, last_bb);
665 gcc_assert (imm);
666 if (imm_dom_path_with_freeing_call (last_bb, imm))
667 break;
669 last_bb = imm;
671 if (last_bb == gbb)
672 remove = true;
673 break;
676 if (cleanup)
678 unsigned int j = 0, l = v.length ();
679 for (i = 0; i < l; i++)
680 if (v[i] != to_pop
681 && (gimple_uid (v[i])
682 == ((sanopt_info *)
683 gimple_bb (v[i])->aux)->freeing_call_events))
685 if (i != j)
686 v[j] = v[i];
687 j++;
689 v.truncate (j);
692 return remove;
695 /* Optimize away redundant ASAN_CHECK calls. */
697 static bool
698 maybe_optimize_asan_check_ifn (class sanopt_ctx *ctx, gimple *stmt)
700 gcc_assert (gimple_call_num_args (stmt) == 4);
701 tree ptr = gimple_call_arg (stmt, 1);
702 tree len = gimple_call_arg (stmt, 2);
703 basic_block bb = gimple_bb (stmt);
704 sanopt_info *info = (sanopt_info *) bb->aux;
706 if (TREE_CODE (len) != INTEGER_CST)
707 return false;
708 if (integer_zerop (len))
709 return false;
711 gimple_set_uid (stmt, info->freeing_call_events);
713 auto_vec<gimple *> *ptr_checks = &ctx->asan_check_map.get_or_insert (ptr);
715 tree base_addr = maybe_get_single_definition (ptr);
716 auto_vec<gimple *> *base_checks = NULL;
717 if (base_addr)
719 base_checks = &ctx->asan_check_map.get_or_insert (base_addr);
720 /* Original pointer might have been invalidated. */
721 ptr_checks = ctx->asan_check_map.get (ptr);
724 gimple *g = maybe_get_dominating_check (*ptr_checks);
725 gimple *g2 = NULL;
727 if (base_checks)
728 /* Try with base address as well. */
729 g2 = maybe_get_dominating_check (*base_checks);
731 if (g == NULL && g2 == NULL)
733 /* For this PTR we don't have any ASAN_CHECK stmts recorded, so there's
734 nothing to optimize yet. */
735 ptr_checks->safe_push (stmt);
736 if (base_checks)
737 base_checks->safe_push (stmt);
738 return false;
741 bool remove = false;
743 if (ptr_checks)
744 remove = can_remove_asan_check (*ptr_checks, len, bb);
746 if (!remove && base_checks)
747 /* Try with base address as well. */
748 remove = can_remove_asan_check (*base_checks, len, bb);
750 if (!remove)
752 ptr_checks->safe_push (stmt);
753 if (base_checks)
754 base_checks->safe_push (stmt);
757 return remove;
760 /* Try to optimize away redundant UBSAN_NULL and ASAN_CHECK calls.
762 We walk blocks in the CFG via a depth first search of the dominator
763 tree; we push unique UBSAN_NULL or ASAN_CHECK statements into a vector
764 in the NULL_CHECK_MAP or ASAN_CHECK_MAP hash maps as we enter the
765 blocks. When leaving a block, we mark the block as visited; then
766 when checking the statements in the vector, we ignore statements that
767 are coming from already visited blocks, because these cannot dominate
768 anything anymore. CTX is a sanopt context. */
770 static void
771 sanopt_optimize_walker (basic_block bb, class sanopt_ctx *ctx)
773 basic_block son;
774 gimple_stmt_iterator gsi;
775 sanopt_info *info = (sanopt_info *) bb->aux;
776 bool asan_check_optimize = (flag_sanitize & SANITIZE_ADDRESS) != 0;
778 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi);)
780 gimple *stmt = gsi_stmt (gsi);
781 bool remove = false;
783 if (!is_gimple_call (stmt))
785 /* Handle asm volatile or asm with "memory" clobber
786 the same as potentionally freeing call. */
787 gasm *asm_stmt = dyn_cast <gasm *> (stmt);
788 if (asm_stmt
789 && asan_check_optimize
790 && (gimple_asm_clobbers_memory_p (asm_stmt)
791 || gimple_asm_volatile_p (asm_stmt)))
792 info->freeing_call_events++;
793 gsi_next (&gsi);
794 continue;
797 if (asan_check_optimize && !nonfreeing_call_p (stmt))
798 info->freeing_call_events++;
800 /* If __asan_before_dynamic_init ("module"); is followed by
801 __asan_after_dynamic_init (); without intervening memory loads/stores,
802 there is nothing to guard, so optimize both away. */
803 if (asan_check_optimize
804 && gimple_call_builtin_p (stmt, BUILT_IN_ASAN_BEFORE_DYNAMIC_INIT))
806 use_operand_p use;
807 gimple *use_stmt;
808 if (single_imm_use (gimple_vdef (stmt), &use, &use_stmt))
810 if (is_gimple_call (use_stmt)
811 && gimple_call_builtin_p (use_stmt,
812 BUILT_IN_ASAN_AFTER_DYNAMIC_INIT))
814 unlink_stmt_vdef (use_stmt);
815 gimple_stmt_iterator gsi2 = gsi_for_stmt (use_stmt);
816 gsi_remove (&gsi2, true);
817 remove = true;
822 if (gimple_call_internal_p (stmt))
823 switch (gimple_call_internal_fn (stmt))
825 case IFN_UBSAN_NULL:
826 remove = maybe_optimize_ubsan_null_ifn (ctx, stmt);
827 break;
828 case IFN_UBSAN_VPTR:
829 remove = maybe_optimize_ubsan_vptr_ifn (ctx, stmt);
830 break;
831 case IFN_UBSAN_PTR:
832 remove = maybe_optimize_ubsan_ptr_ifn (ctx, stmt);
833 break;
834 case IFN_ASAN_CHECK:
835 if (asan_check_optimize)
836 remove = maybe_optimize_asan_check_ifn (ctx, stmt);
837 if (!remove)
838 ctx->asan_num_accesses++;
839 break;
840 case IFN_ASAN_MARK:
841 ctx->contains_asan_mark = true;
842 break;
843 default:
844 break;
847 if (remove)
849 /* Drop this check. */
850 if (dump_file && (dump_flags & TDF_DETAILS))
852 fprintf (dump_file, "Optimizing out: ");
853 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
855 unlink_stmt_vdef (stmt);
856 gsi_remove (&gsi, true);
858 else
860 if (dump_file && (dump_flags & TDF_DETAILS))
862 fprintf (dump_file, "Leaving: ");
863 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
866 gsi_next (&gsi);
870 if (asan_check_optimize)
872 info->has_freeing_call_p = info->freeing_call_events != 0;
873 info->has_freeing_call_computed_p = true;
876 for (son = first_dom_son (CDI_DOMINATORS, bb);
877 son;
878 son = next_dom_son (CDI_DOMINATORS, son))
879 sanopt_optimize_walker (son, ctx);
881 /* We're leaving this BB, so mark it to that effect. */
882 info->visited_p = true;
885 /* Try to remove redundant sanitizer checks in function FUN. */
887 static int
888 sanopt_optimize (function *fun, bool *contains_asan_mark)
890 class sanopt_ctx ctx;
891 ctx.asan_num_accesses = 0;
892 ctx.contains_asan_mark = false;
894 /* Set up block info for each basic block. */
895 alloc_aux_for_blocks (sizeof (sanopt_info));
897 /* We're going to do a dominator walk, so ensure that we have
898 dominance information. */
899 calculate_dominance_info (CDI_DOMINATORS);
901 /* Recursively walk the dominator tree optimizing away
902 redundant checks. */
903 sanopt_optimize_walker (ENTRY_BLOCK_PTR_FOR_FN (fun), &ctx);
905 free_aux_for_blocks ();
907 *contains_asan_mark = ctx.contains_asan_mark;
908 return ctx.asan_num_accesses;
911 /* Perform optimization of sanitize functions. */
913 namespace {
915 const pass_data pass_data_sanopt =
917 GIMPLE_PASS, /* type */
918 "sanopt", /* name */
919 OPTGROUP_NONE, /* optinfo_flags */
920 TV_NONE, /* tv_id */
921 ( PROP_ssa | PROP_cfg | PROP_gimple_leh ), /* properties_required */
922 0, /* properties_provided */
923 0, /* properties_destroyed */
924 0, /* todo_flags_start */
925 TODO_update_ssa, /* todo_flags_finish */
928 class pass_sanopt : public gimple_opt_pass
930 public:
931 pass_sanopt (gcc::context *ctxt)
932 : gimple_opt_pass (pass_data_sanopt, ctxt)
935 /* opt_pass methods: */
936 virtual bool gate (function *) { return flag_sanitize; }
937 virtual unsigned int execute (function *);
939 }; // class pass_sanopt
941 /* Sanitize all ASAN_MARK unpoison calls that are not reachable by a BB
942 that contains an ASAN_MARK poison. All these ASAN_MARK unpoison call
943 can be removed as all variables are unpoisoned in a function prologue. */
945 static void
946 sanitize_asan_mark_unpoison (void)
948 /* 1) Find all BBs that contain an ASAN_MARK poison call. */
949 auto_sbitmap with_poison (last_basic_block_for_fn (cfun) + 1);
950 bitmap_clear (with_poison);
951 basic_block bb;
953 FOR_EACH_BB_FN (bb, cfun)
955 if (bitmap_bit_p (with_poison, bb->index))
956 continue;
958 gimple_stmt_iterator gsi;
959 for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi); gsi_prev (&gsi))
961 gimple *stmt = gsi_stmt (gsi);
962 if (asan_mark_p (stmt, ASAN_MARK_POISON))
964 bitmap_set_bit (with_poison, bb->index);
965 break;
970 auto_sbitmap poisoned (last_basic_block_for_fn (cfun) + 1);
971 bitmap_clear (poisoned);
972 auto_sbitmap worklist (last_basic_block_for_fn (cfun) + 1);
973 bitmap_copy (worklist, with_poison);
975 /* 2) Propagate the information to all reachable blocks. */
976 while (!bitmap_empty_p (worklist))
978 unsigned i = bitmap_first_set_bit (worklist);
979 bitmap_clear_bit (worklist, i);
980 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
981 gcc_assert (bb);
983 edge e;
984 edge_iterator ei;
985 FOR_EACH_EDGE (e, ei, bb->succs)
986 if (!bitmap_bit_p (poisoned, e->dest->index))
988 bitmap_set_bit (poisoned, e->dest->index);
989 bitmap_set_bit (worklist, e->dest->index);
993 /* 3) Iterate all BBs not included in POISONED BBs and remove unpoison
994 ASAN_MARK preceding an ASAN_MARK poison (which can still happen). */
995 FOR_EACH_BB_FN (bb, cfun)
997 if (bitmap_bit_p (poisoned, bb->index))
998 continue;
1000 gimple_stmt_iterator gsi;
1001 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi);)
1003 gimple *stmt = gsi_stmt (gsi);
1004 if (gimple_call_internal_p (stmt, IFN_ASAN_MARK))
1006 if (asan_mark_p (stmt, ASAN_MARK_POISON))
1007 break;
1008 else
1010 if (dump_file)
1011 fprintf (dump_file, "Removing ASAN_MARK unpoison\n");
1012 unlink_stmt_vdef (stmt);
1013 release_defs (stmt);
1014 gsi_remove (&gsi, true);
1015 continue;
1019 gsi_next (&gsi);
1024 /* Return true when STMT is either ASAN_CHECK call or a call of a function
1025 that can contain an ASAN_CHECK. */
1027 static bool
1028 maybe_contains_asan_check (gimple *stmt)
1030 if (is_gimple_call (stmt))
1032 if (gimple_call_internal_p (stmt, IFN_ASAN_MARK))
1033 return false;
1034 else
1035 return !(gimple_call_flags (stmt) & ECF_CONST);
1037 else if (is_a<gasm *> (stmt))
1038 return true;
1040 return false;
1043 /* Sanitize all ASAN_MARK poison calls that are not followed by an ASAN_CHECK
1044 call. These calls can be removed. */
1046 static void
1047 sanitize_asan_mark_poison (void)
1049 /* 1) Find all BBs that possibly contain an ASAN_CHECK. */
1050 auto_sbitmap with_check (last_basic_block_for_fn (cfun) + 1);
1051 bitmap_clear (with_check);
1052 basic_block bb;
1054 FOR_EACH_BB_FN (bb, cfun)
1056 gimple_stmt_iterator gsi;
1057 for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi); gsi_prev (&gsi))
1059 gimple *stmt = gsi_stmt (gsi);
1060 if (maybe_contains_asan_check (stmt))
1062 bitmap_set_bit (with_check, bb->index);
1063 break;
1068 auto_sbitmap can_reach_check (last_basic_block_for_fn (cfun) + 1);
1069 bitmap_clear (can_reach_check);
1070 auto_sbitmap worklist (last_basic_block_for_fn (cfun) + 1);
1071 bitmap_copy (worklist, with_check);
1073 /* 2) Propagate the information to all definitions blocks. */
1074 while (!bitmap_empty_p (worklist))
1076 unsigned i = bitmap_first_set_bit (worklist);
1077 bitmap_clear_bit (worklist, i);
1078 basic_block bb = BASIC_BLOCK_FOR_FN (cfun, i);
1079 gcc_assert (bb);
1081 edge e;
1082 edge_iterator ei;
1083 FOR_EACH_EDGE (e, ei, bb->preds)
1084 if (!bitmap_bit_p (can_reach_check, e->src->index))
1086 bitmap_set_bit (can_reach_check, e->src->index);
1087 bitmap_set_bit (worklist, e->src->index);
1091 /* 3) Iterate all BBs not included in CAN_REACH_CHECK BBs and remove poison
1092 ASAN_MARK not followed by a call to function having an ASAN_CHECK. */
1093 FOR_EACH_BB_FN (bb, cfun)
1095 if (bitmap_bit_p (can_reach_check, bb->index))
1096 continue;
1098 gimple_stmt_iterator gsi;
1099 for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi);)
1101 gimple *stmt = gsi_stmt (gsi);
1102 if (maybe_contains_asan_check (stmt))
1103 break;
1104 else if (asan_mark_p (stmt, ASAN_MARK_POISON))
1106 if (dump_file)
1107 fprintf (dump_file, "Removing ASAN_MARK poison\n");
1108 unlink_stmt_vdef (stmt);
1109 release_defs (stmt);
1110 gimple_stmt_iterator gsi2 = gsi;
1111 gsi_prev (&gsi);
1112 gsi_remove (&gsi2, true);
1113 continue;
1116 gsi_prev (&gsi);
1121 /* Rewrite all usages of tree OP which is a PARM_DECL with a VAR_DECL
1122 that is it's DECL_VALUE_EXPR. */
1124 static tree
1125 rewrite_usage_of_param (tree *op, int *walk_subtrees, void *)
1127 if (TREE_CODE (*op) == PARM_DECL && DECL_HAS_VALUE_EXPR_P (*op))
1129 *op = DECL_VALUE_EXPR (*op);
1130 *walk_subtrees = 0;
1133 return NULL;
1136 /* For a given function FUN, rewrite all addressable parameters so that
1137 a new automatic variable is introduced. Right after function entry
1138 a parameter is assigned to the variable. */
1140 static void
1141 sanitize_rewrite_addressable_params (function *fun)
1143 gimple *g;
1144 gimple_seq stmts = NULL;
1145 bool has_any_addressable_param = false;
1146 auto_vec<tree> clear_value_expr_list;
1148 for (tree arg = DECL_ARGUMENTS (current_function_decl);
1149 arg; arg = DECL_CHAIN (arg))
1151 tree type = TREE_TYPE (arg);
1152 if (TREE_ADDRESSABLE (arg)
1153 && !TREE_ADDRESSABLE (type)
1154 && !TREE_THIS_VOLATILE (arg)
1155 && TREE_CODE (TYPE_SIZE (type)) == INTEGER_CST)
1157 TREE_ADDRESSABLE (arg) = 0;
1158 /* The parameter is no longer addressable. */
1159 has_any_addressable_param = true;
1161 /* Create a new automatic variable. */
1162 tree var = build_decl (DECL_SOURCE_LOCATION (arg),
1163 VAR_DECL, DECL_NAME (arg), type);
1164 TREE_ADDRESSABLE (var) = 1;
1165 DECL_IGNORED_P (var) = 1;
1167 gimple_add_tmp_var (var);
1169 /* We skip parameters that have a DECL_VALUE_EXPR. */
1170 if (DECL_HAS_VALUE_EXPR_P (arg))
1171 continue;
1173 if (dump_file)
1174 fprintf (dump_file,
1175 "Rewriting parameter whose address is taken: %s\n",
1176 IDENTIFIER_POINTER (DECL_NAME (arg)));
1178 SET_DECL_PT_UID (var, DECL_PT_UID (arg));
1180 /* Assign value of parameter to newly created variable. */
1181 if ((TREE_CODE (type) == COMPLEX_TYPE
1182 || TREE_CODE (type) == VECTOR_TYPE))
1184 /* We need to create a SSA name that will be used for the
1185 assignment. */
1186 DECL_GIMPLE_REG_P (arg) = 1;
1187 tree tmp = get_or_create_ssa_default_def (cfun, arg);
1188 g = gimple_build_assign (var, tmp);
1189 gimple_set_location (g, DECL_SOURCE_LOCATION (arg));
1190 gimple_seq_add_stmt (&stmts, g);
1192 else
1194 g = gimple_build_assign (var, arg);
1195 gimple_set_location (g, DECL_SOURCE_LOCATION (arg));
1196 gimple_seq_add_stmt (&stmts, g);
1199 if (target_for_debug_bind (arg))
1201 g = gimple_build_debug_bind (arg, var, NULL);
1202 gimple_seq_add_stmt (&stmts, g);
1203 clear_value_expr_list.safe_push (arg);
1206 DECL_HAS_VALUE_EXPR_P (arg) = 1;
1207 SET_DECL_VALUE_EXPR (arg, var);
1211 if (!has_any_addressable_param)
1212 return;
1214 /* Replace all usages of PARM_DECLs with the newly
1215 created variable VAR. */
1216 basic_block bb;
1217 FOR_EACH_BB_FN (bb, fun)
1219 gimple_stmt_iterator gsi;
1220 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1222 gimple *stmt = gsi_stmt (gsi);
1223 gimple_stmt_iterator it = gsi_for_stmt (stmt);
1224 walk_gimple_stmt (&it, NULL, rewrite_usage_of_param, NULL);
1226 for (gsi = gsi_start_phis (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1228 gphi *phi = dyn_cast<gphi *> (gsi_stmt (gsi));
1229 for (unsigned i = 0; i < gimple_phi_num_args (phi); ++i)
1231 hash_set<tree> visited_nodes;
1232 walk_tree (gimple_phi_arg_def_ptr (phi, i),
1233 rewrite_usage_of_param, NULL, &visited_nodes);
1238 /* Unset value expr for parameters for which we created debug bind
1239 expressions. */
1240 unsigned i;
1241 tree arg;
1242 FOR_EACH_VEC_ELT (clear_value_expr_list, i, arg)
1244 DECL_HAS_VALUE_EXPR_P (arg) = 0;
1245 SET_DECL_VALUE_EXPR (arg, NULL_TREE);
1248 /* Insert default assignments at the beginning of a function. */
1249 basic_block entry_bb = ENTRY_BLOCK_PTR_FOR_FN (fun);
1250 entry_bb = split_edge (single_succ_edge (entry_bb));
1252 gimple_stmt_iterator gsi = gsi_start_bb (entry_bb);
1253 gsi_insert_seq_before (&gsi, stmts, GSI_NEW_STMT);
1256 unsigned int
1257 pass_sanopt::execute (function *fun)
1259 basic_block bb;
1260 int asan_num_accesses = 0;
1261 bool contains_asan_mark = false;
1263 /* Try to remove redundant checks. */
1264 if (optimize
1265 && (flag_sanitize
1266 & (SANITIZE_NULL | SANITIZE_ALIGNMENT
1267 | SANITIZE_ADDRESS | SANITIZE_VPTR | SANITIZE_POINTER_OVERFLOW)))
1268 asan_num_accesses = sanopt_optimize (fun, &contains_asan_mark);
1269 else if (flag_sanitize & SANITIZE_ADDRESS)
1271 gimple_stmt_iterator gsi;
1272 FOR_EACH_BB_FN (bb, fun)
1273 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
1275 gimple *stmt = gsi_stmt (gsi);
1276 if (gimple_call_internal_p (stmt, IFN_ASAN_CHECK))
1277 ++asan_num_accesses;
1278 else if (gimple_call_internal_p (stmt, IFN_ASAN_MARK))
1279 contains_asan_mark = true;
1283 if (contains_asan_mark)
1285 sanitize_asan_mark_unpoison ();
1286 sanitize_asan_mark_poison ();
1289 if (asan_sanitize_stack_p ())
1290 sanitize_rewrite_addressable_params (fun);
1292 bool use_calls = ASAN_INSTRUMENTATION_WITH_CALL_THRESHOLD < INT_MAX
1293 && asan_num_accesses >= ASAN_INSTRUMENTATION_WITH_CALL_THRESHOLD;
1295 hash_map<tree, tree> shadow_vars_mapping;
1296 bool need_commit_edge_insert = false;
1297 FOR_EACH_BB_FN (bb, fun)
1299 gimple_stmt_iterator gsi;
1300 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); )
1302 gimple *stmt = gsi_stmt (gsi);
1303 bool no_next = false;
1305 if (!is_gimple_call (stmt))
1307 gsi_next (&gsi);
1308 continue;
1311 if (gimple_call_internal_p (stmt))
1313 enum internal_fn ifn = gimple_call_internal_fn (stmt);
1314 switch (ifn)
1316 case IFN_UBSAN_NULL:
1317 no_next = ubsan_expand_null_ifn (&gsi);
1318 break;
1319 case IFN_UBSAN_BOUNDS:
1320 no_next = ubsan_expand_bounds_ifn (&gsi);
1321 break;
1322 case IFN_UBSAN_OBJECT_SIZE:
1323 no_next = ubsan_expand_objsize_ifn (&gsi);
1324 break;
1325 case IFN_UBSAN_PTR:
1326 no_next = ubsan_expand_ptr_ifn (&gsi);
1327 break;
1328 case IFN_UBSAN_VPTR:
1329 no_next = ubsan_expand_vptr_ifn (&gsi);
1330 break;
1331 case IFN_ASAN_CHECK:
1332 no_next = asan_expand_check_ifn (&gsi, use_calls);
1333 break;
1334 case IFN_ASAN_MARK:
1335 no_next = asan_expand_mark_ifn (&gsi);
1336 break;
1337 case IFN_ASAN_POISON:
1338 no_next = asan_expand_poison_ifn (&gsi,
1339 &need_commit_edge_insert,
1340 shadow_vars_mapping);
1341 break;
1342 default:
1343 break;
1346 else if (gimple_call_builtin_p (stmt, BUILT_IN_NORMAL))
1348 tree callee = gimple_call_fndecl (stmt);
1349 switch (DECL_FUNCTION_CODE (callee))
1351 case BUILT_IN_UNREACHABLE:
1352 if (sanitize_flags_p (SANITIZE_UNREACHABLE))
1353 no_next = ubsan_instrument_unreachable (&gsi);
1354 break;
1355 default:
1356 break;
1360 if (dump_file && (dump_flags & TDF_DETAILS))
1362 fprintf (dump_file, "Expanded: ");
1363 print_gimple_stmt (dump_file, stmt, 0, dump_flags);
1366 if (!no_next)
1367 gsi_next (&gsi);
1371 if (need_commit_edge_insert)
1372 gsi_commit_edge_inserts ();
1374 return 0;
1377 } // anon namespace
1379 gimple_opt_pass *
1380 make_pass_sanopt (gcc::context *ctxt)
1382 return new pass_sanopt (ctxt);