PR sanitizer/80067
[official-gcc.git] / gcc / tree-ssa-strlen.c
blob141115ed12b3626ee82be2c592a72c99376d14dd
1 /* String length optimization
2 Copyright (C) 2011-2017 Free Software Foundation, Inc.
3 Contributed by Jakub Jelinek <jakub@redhat.com>
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "backend.h"
25 #include "rtl.h"
26 #include "tree.h"
27 #include "gimple.h"
28 #include "alloc-pool.h"
29 #include "tree-pass.h"
30 #include "ssa.h"
31 #include "cgraph.h"
32 #include "gimple-pretty-print.h"
33 #include "fold-const.h"
34 #include "stor-layout.h"
35 #include "gimple-fold.h"
36 #include "tree-eh.h"
37 #include "gimplify.h"
38 #include "gimple-iterator.h"
39 #include "gimplify-me.h"
40 #include "expr.h"
41 #include "tree-dfa.h"
42 #include "domwalk.h"
43 #include "tree-ssa-propagate.h"
44 #include "params.h"
45 #include "ipa-chkp.h"
46 #include "tree-hash-traits.h"
47 #include "builtins.h"
49 /* A vector indexed by SSA_NAME_VERSION. 0 means unknown, positive value
50 is an index into strinfo vector, negative value stands for
51 string length of a string literal (~strlen). */
52 static vec<int> ssa_ver_to_stridx;
54 /* Number of currently active string indexes plus one. */
55 static int max_stridx;
57 /* String information record. */
58 struct strinfo
60 /* String length of this string. */
61 tree length;
62 /* Any of the corresponding pointers for querying alias oracle. */
63 tree ptr;
64 /* Statement for delayed length computation. */
65 gimple *stmt;
66 /* Pointer to '\0' if known, if NULL, it can be computed as
67 ptr + length. */
68 tree endptr;
69 /* Reference count. Any changes to strinfo entry possibly shared
70 with dominating basic blocks need unshare_strinfo first, except
71 for dont_invalidate which affects only the immediately next
72 maybe_invalidate. */
73 int refcount;
74 /* Copy of index. get_strinfo (si->idx) should return si; */
75 int idx;
76 /* These 3 fields are for chaining related string pointers together.
77 E.g. for
78 bl = strlen (b); dl = strlen (d); strcpy (a, b); c = a + bl;
79 strcpy (c, d); e = c + dl;
80 strinfo(a) -> strinfo(c) -> strinfo(e)
81 All have ->first field equal to strinfo(a)->idx and are doubly
82 chained through prev/next fields. The later strinfos are required
83 to point into the same string with zero or more bytes after
84 the previous pointer and all bytes in between the two pointers
85 must be non-zero. Functions like strcpy or memcpy are supposed
86 to adjust all previous strinfo lengths, but not following strinfo
87 lengths (those are uncertain, usually invalidated during
88 maybe_invalidate, except when the alias oracle knows better).
89 Functions like strcat on the other side adjust the whole
90 related strinfo chain.
91 They are updated lazily, so to use the chain the same first fields
92 and si->prev->next == si->idx needs to be verified. */
93 int first;
94 int next;
95 int prev;
96 /* A flag whether the string is known to be written in the current
97 function. */
98 bool writable;
99 /* A flag for the next maybe_invalidate that this strinfo shouldn't
100 be invalidated. Always cleared by maybe_invalidate. */
101 bool dont_invalidate;
104 /* Pool for allocating strinfo_struct entries. */
105 static object_allocator<strinfo> strinfo_pool ("strinfo pool");
107 /* Vector mapping positive string indexes to strinfo, for the
108 current basic block. The first pointer in the vector is special,
109 it is either NULL, meaning the vector isn't shared, or it is
110 a basic block pointer to the owner basic_block if shared.
111 If some other bb wants to modify the vector, the vector needs
112 to be unshared first, and only the owner bb is supposed to free it. */
113 static vec<strinfo *, va_heap, vl_embed> *stridx_to_strinfo;
115 /* One OFFSET->IDX mapping. */
116 struct stridxlist
118 struct stridxlist *next;
119 HOST_WIDE_INT offset;
120 int idx;
123 /* Hash table entry, mapping a DECL to a chain of OFFSET->IDX mappings. */
124 struct decl_stridxlist_map
126 struct tree_map_base base;
127 struct stridxlist list;
130 /* Hash table for mapping decls to a chained list of offset -> idx
131 mappings. */
132 static hash_map<tree_decl_hash, stridxlist> *decl_to_stridxlist_htab;
134 /* Obstack for struct stridxlist and struct decl_stridxlist_map. */
135 static struct obstack stridx_obstack;
137 /* Last memcpy statement if it could be adjusted if the trailing
138 '\0' written is immediately overwritten, or
139 *x = '\0' store that could be removed if it is immediately overwritten. */
140 struct laststmt_struct
142 gimple *stmt;
143 tree len;
144 int stridx;
145 } laststmt;
147 static int get_stridx_plus_constant (strinfo *, HOST_WIDE_INT, tree);
149 /* Return strinfo vector entry IDX. */
151 static inline strinfo *
152 get_strinfo (int idx)
154 if (vec_safe_length (stridx_to_strinfo) <= (unsigned int) idx)
155 return NULL;
156 return (*stridx_to_strinfo)[idx];
159 /* Helper function for get_stridx. */
161 static int
162 get_addr_stridx (tree exp, tree ptr)
164 HOST_WIDE_INT off;
165 struct stridxlist *list, *last = NULL;
166 tree base;
168 if (!decl_to_stridxlist_htab)
169 return 0;
171 base = get_addr_base_and_unit_offset (exp, &off);
172 if (base == NULL || !DECL_P (base))
173 return 0;
175 list = decl_to_stridxlist_htab->get (base);
176 if (list == NULL)
177 return 0;
181 if (list->offset == off)
182 return list->idx;
183 if (list->offset > off)
184 return 0;
185 last = list;
186 list = list->next;
188 while (list);
190 if (ptr && last && last->idx > 0)
192 strinfo *si = get_strinfo (last->idx);
193 if (si
194 && si->length
195 && TREE_CODE (si->length) == INTEGER_CST
196 && compare_tree_int (si->length, off - last->offset) != -1)
197 return get_stridx_plus_constant (si, off - last->offset, ptr);
199 return 0;
202 /* Return string index for EXP. */
204 static int
205 get_stridx (tree exp)
207 tree s, o;
209 if (TREE_CODE (exp) == SSA_NAME)
211 if (ssa_ver_to_stridx[SSA_NAME_VERSION (exp)])
212 return ssa_ver_to_stridx[SSA_NAME_VERSION (exp)];
213 int i;
214 tree e = exp;
215 HOST_WIDE_INT off = 0;
216 for (i = 0; i < 5; i++)
218 gimple *def_stmt = SSA_NAME_DEF_STMT (e);
219 if (!is_gimple_assign (def_stmt)
220 || gimple_assign_rhs_code (def_stmt) != POINTER_PLUS_EXPR)
221 return 0;
222 tree rhs1 = gimple_assign_rhs1 (def_stmt);
223 tree rhs2 = gimple_assign_rhs2 (def_stmt);
224 if (TREE_CODE (rhs1) != SSA_NAME
225 || !tree_fits_shwi_p (rhs2))
226 return 0;
227 HOST_WIDE_INT this_off = tree_to_shwi (rhs2);
228 if (this_off < 0)
229 return 0;
230 off = (unsigned HOST_WIDE_INT) off + this_off;
231 if (off < 0)
232 return 0;
233 if (ssa_ver_to_stridx[SSA_NAME_VERSION (rhs1)])
235 strinfo *si
236 = get_strinfo (ssa_ver_to_stridx[SSA_NAME_VERSION (rhs1)]);
237 if (si
238 && si->length
239 && TREE_CODE (si->length) == INTEGER_CST
240 && compare_tree_int (si->length, off) != -1)
241 return get_stridx_plus_constant (si, off, exp);
243 e = rhs1;
245 return 0;
248 if (TREE_CODE (exp) == ADDR_EXPR)
250 int idx = get_addr_stridx (TREE_OPERAND (exp, 0), exp);
251 if (idx != 0)
252 return idx;
255 s = string_constant (exp, &o);
256 if (s != NULL_TREE
257 && (o == NULL_TREE || tree_fits_shwi_p (o))
258 && TREE_STRING_LENGTH (s) > 0)
260 HOST_WIDE_INT offset = o ? tree_to_shwi (o) : 0;
261 const char *p = TREE_STRING_POINTER (s);
262 int max = TREE_STRING_LENGTH (s) - 1;
264 if (p[max] == '\0' && offset >= 0 && offset <= max)
265 return ~(int) strlen (p + offset);
267 return 0;
270 /* Return true if strinfo vector is shared with the immediate dominator. */
272 static inline bool
273 strinfo_shared (void)
275 return vec_safe_length (stridx_to_strinfo)
276 && (*stridx_to_strinfo)[0] != NULL;
279 /* Unshare strinfo vector that is shared with the immediate dominator. */
281 static void
282 unshare_strinfo_vec (void)
284 strinfo *si;
285 unsigned int i = 0;
287 gcc_assert (strinfo_shared ());
288 stridx_to_strinfo = vec_safe_copy (stridx_to_strinfo);
289 for (i = 1; vec_safe_iterate (stridx_to_strinfo, i, &si); ++i)
290 if (si != NULL)
291 si->refcount++;
292 (*stridx_to_strinfo)[0] = NULL;
295 /* Attempt to create a string index for exp, ADDR_EXPR's operand.
296 Return a pointer to the location where the string index can
297 be stored (if 0) or is stored, or NULL if this can't be tracked. */
299 static int *
300 addr_stridxptr (tree exp)
302 HOST_WIDE_INT off;
304 tree base = get_addr_base_and_unit_offset (exp, &off);
305 if (base == NULL_TREE || !DECL_P (base))
306 return NULL;
308 if (!decl_to_stridxlist_htab)
310 decl_to_stridxlist_htab
311 = new hash_map<tree_decl_hash, stridxlist> (64);
312 gcc_obstack_init (&stridx_obstack);
315 bool existed;
316 stridxlist *list = &decl_to_stridxlist_htab->get_or_insert (base, &existed);
317 if (existed)
319 int i;
320 stridxlist *before = NULL;
321 for (i = 0; i < 32; i++)
323 if (list->offset == off)
324 return &list->idx;
325 if (list->offset > off && before == NULL)
326 before = list;
327 if (list->next == NULL)
328 break;
329 list = list->next;
331 if (i == 32)
332 return NULL;
333 if (before)
335 list = before;
336 before = XOBNEW (&stridx_obstack, struct stridxlist);
337 *before = *list;
338 list->next = before;
339 list->offset = off;
340 list->idx = 0;
341 return &list->idx;
343 list->next = XOBNEW (&stridx_obstack, struct stridxlist);
344 list = list->next;
347 list->next = NULL;
348 list->offset = off;
349 list->idx = 0;
350 return &list->idx;
353 /* Create a new string index, or return 0 if reached limit. */
355 static int
356 new_stridx (tree exp)
358 int idx;
359 if (max_stridx >= PARAM_VALUE (PARAM_MAX_TRACKED_STRLENS))
360 return 0;
361 if (TREE_CODE (exp) == SSA_NAME)
363 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (exp))
364 return 0;
365 idx = max_stridx++;
366 ssa_ver_to_stridx[SSA_NAME_VERSION (exp)] = idx;
367 return idx;
369 if (TREE_CODE (exp) == ADDR_EXPR)
371 int *pidx = addr_stridxptr (TREE_OPERAND (exp, 0));
372 if (pidx != NULL)
374 gcc_assert (*pidx == 0);
375 *pidx = max_stridx++;
376 return *pidx;
379 return 0;
382 /* Like new_stridx, but for ADDR_EXPR's operand instead. */
384 static int
385 new_addr_stridx (tree exp)
387 int *pidx;
388 if (max_stridx >= PARAM_VALUE (PARAM_MAX_TRACKED_STRLENS))
389 return 0;
390 pidx = addr_stridxptr (exp);
391 if (pidx != NULL)
393 gcc_assert (*pidx == 0);
394 *pidx = max_stridx++;
395 return *pidx;
397 return 0;
400 /* Create a new strinfo. */
402 static strinfo *
403 new_strinfo (tree ptr, int idx, tree length)
405 strinfo *si = strinfo_pool.allocate ();
406 si->length = length;
407 si->ptr = ptr;
408 si->stmt = NULL;
409 si->endptr = NULL_TREE;
410 si->refcount = 1;
411 si->idx = idx;
412 si->first = 0;
413 si->prev = 0;
414 si->next = 0;
415 si->writable = false;
416 si->dont_invalidate = false;
417 return si;
420 /* Decrease strinfo refcount and free it if not referenced anymore. */
422 static inline void
423 free_strinfo (strinfo *si)
425 if (si && --si->refcount == 0)
426 strinfo_pool.remove (si);
429 /* Set strinfo in the vector entry IDX to SI. */
431 static inline void
432 set_strinfo (int idx, strinfo *si)
434 if (vec_safe_length (stridx_to_strinfo) && (*stridx_to_strinfo)[0])
435 unshare_strinfo_vec ();
436 if (vec_safe_length (stridx_to_strinfo) <= (unsigned int) idx)
437 vec_safe_grow_cleared (stridx_to_strinfo, idx + 1);
438 (*stridx_to_strinfo)[idx] = si;
441 /* Return string length, or NULL if it can't be computed. */
443 static tree
444 get_string_length (strinfo *si)
446 if (si->length)
447 return si->length;
449 if (si->stmt)
451 gimple *stmt = si->stmt, *lenstmt;
452 bool with_bounds = gimple_call_with_bounds_p (stmt);
453 tree callee, lhs, fn, tem;
454 location_t loc;
455 gimple_stmt_iterator gsi;
457 gcc_assert (is_gimple_call (stmt));
458 callee = gimple_call_fndecl (stmt);
459 gcc_assert (callee && DECL_BUILT_IN_CLASS (callee) == BUILT_IN_NORMAL);
460 lhs = gimple_call_lhs (stmt);
461 /* unshare_strinfo is intentionally not called here. The (delayed)
462 transformation of strcpy or strcat into stpcpy is done at the place
463 of the former strcpy/strcat call and so can affect all the strinfos
464 with the same stmt. If they were unshared before and transformation
465 has been already done, the handling of BUILT_IN_STPCPY{,_CHK} should
466 just compute the right length. */
467 switch (DECL_FUNCTION_CODE (callee))
469 case BUILT_IN_STRCAT:
470 case BUILT_IN_STRCAT_CHK:
471 case BUILT_IN_STRCAT_CHKP:
472 case BUILT_IN_STRCAT_CHK_CHKP:
473 gsi = gsi_for_stmt (stmt);
474 fn = builtin_decl_implicit (BUILT_IN_STRLEN);
475 gcc_assert (lhs == NULL_TREE);
476 tem = unshare_expr (gimple_call_arg (stmt, 0));
477 if (with_bounds)
479 lenstmt = gimple_build_call (chkp_maybe_create_clone (fn)->decl,
480 2, tem, gimple_call_arg (stmt, 1));
481 gimple_call_set_with_bounds (lenstmt, true);
483 else
484 lenstmt = gimple_build_call (fn, 1, tem);
485 lhs = make_ssa_name (TREE_TYPE (TREE_TYPE (fn)), lenstmt);
486 gimple_call_set_lhs (lenstmt, lhs);
487 gimple_set_vuse (lenstmt, gimple_vuse (stmt));
488 gsi_insert_before (&gsi, lenstmt, GSI_SAME_STMT);
489 tem = gimple_call_arg (stmt, 0);
490 if (!ptrofftype_p (TREE_TYPE (lhs)))
492 lhs = convert_to_ptrofftype (lhs);
493 lhs = force_gimple_operand_gsi (&gsi, lhs, true, NULL_TREE,
494 true, GSI_SAME_STMT);
496 lenstmt = gimple_build_assign
497 (make_ssa_name (TREE_TYPE (gimple_call_arg (stmt, 0))),
498 POINTER_PLUS_EXPR,tem, lhs);
499 gsi_insert_before (&gsi, lenstmt, GSI_SAME_STMT);
500 gimple_call_set_arg (stmt, 0, gimple_assign_lhs (lenstmt));
501 lhs = NULL_TREE;
502 /* FALLTHRU */
503 case BUILT_IN_STRCPY:
504 case BUILT_IN_STRCPY_CHK:
505 case BUILT_IN_STRCPY_CHKP:
506 case BUILT_IN_STRCPY_CHK_CHKP:
507 gcc_assert (builtin_decl_implicit_p (BUILT_IN_STPCPY));
508 if (gimple_call_num_args (stmt) == (with_bounds ? 4 : 2))
509 fn = builtin_decl_implicit (BUILT_IN_STPCPY);
510 else
511 fn = builtin_decl_explicit (BUILT_IN_STPCPY_CHK);
512 if (with_bounds)
513 fn = chkp_maybe_create_clone (fn)->decl;
514 gcc_assert (lhs == NULL_TREE);
515 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
517 fprintf (dump_file, "Optimizing: ");
518 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
520 gimple_call_set_fndecl (stmt, fn);
521 lhs = make_ssa_name (TREE_TYPE (TREE_TYPE (fn)), stmt);
522 gimple_call_set_lhs (stmt, lhs);
523 update_stmt (stmt);
524 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
526 fprintf (dump_file, "into: ");
527 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
529 /* FALLTHRU */
530 case BUILT_IN_STPCPY:
531 case BUILT_IN_STPCPY_CHK:
532 case BUILT_IN_STPCPY_CHKP:
533 case BUILT_IN_STPCPY_CHK_CHKP:
534 gcc_assert (lhs != NULL_TREE);
535 loc = gimple_location (stmt);
536 si->endptr = lhs;
537 si->stmt = NULL;
538 lhs = fold_convert_loc (loc, size_type_node, lhs);
539 si->length = fold_convert_loc (loc, size_type_node, si->ptr);
540 si->length = fold_build2_loc (loc, MINUS_EXPR, size_type_node,
541 lhs, si->length);
542 break;
543 case BUILT_IN_MALLOC:
544 break;
545 /* BUILT_IN_CALLOC always has si->length set. */
546 default:
547 gcc_unreachable ();
548 break;
552 return si->length;
555 /* Invalidate string length information for strings whose length
556 might change due to stores in stmt. */
558 static bool
559 maybe_invalidate (gimple *stmt)
561 strinfo *si;
562 unsigned int i;
563 bool nonempty = false;
565 for (i = 1; vec_safe_iterate (stridx_to_strinfo, i, &si); ++i)
566 if (si != NULL)
568 if (!si->dont_invalidate)
570 ao_ref r;
571 /* Do not use si->length. */
572 ao_ref_init_from_ptr_and_size (&r, si->ptr, NULL_TREE);
573 if (stmt_may_clobber_ref_p_1 (stmt, &r))
575 set_strinfo (i, NULL);
576 free_strinfo (si);
577 continue;
580 si->dont_invalidate = false;
581 nonempty = true;
583 return nonempty;
586 /* Unshare strinfo record SI, if it has refcount > 1 or
587 if stridx_to_strinfo vector is shared with some other
588 bbs. */
590 static strinfo *
591 unshare_strinfo (strinfo *si)
593 strinfo *nsi;
595 if (si->refcount == 1 && !strinfo_shared ())
596 return si;
598 nsi = new_strinfo (si->ptr, si->idx, si->length);
599 nsi->stmt = si->stmt;
600 nsi->endptr = si->endptr;
601 nsi->first = si->first;
602 nsi->prev = si->prev;
603 nsi->next = si->next;
604 nsi->writable = si->writable;
605 set_strinfo (si->idx, nsi);
606 free_strinfo (si);
607 return nsi;
610 /* Return first strinfo in the related strinfo chain
611 if all strinfos in between belong to the chain, otherwise
612 NULL. */
614 static strinfo *
615 verify_related_strinfos (strinfo *origsi)
617 strinfo *si = origsi, *psi;
619 if (origsi->first == 0)
620 return NULL;
621 for (; si->prev; si = psi)
623 if (si->first != origsi->first)
624 return NULL;
625 psi = get_strinfo (si->prev);
626 if (psi == NULL)
627 return NULL;
628 if (psi->next != si->idx)
629 return NULL;
631 if (si->idx != si->first)
632 return NULL;
633 return si;
636 /* Attempt to create a new strinfo for BASESI + OFF, or find existing
637 strinfo if there is any. Return it's idx, or 0 if no strinfo has
638 been created. */
640 static int
641 get_stridx_plus_constant (strinfo *basesi, HOST_WIDE_INT off, tree ptr)
643 if (TREE_CODE (ptr) == SSA_NAME && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (ptr))
644 return 0;
646 if (basesi->length == NULL_TREE
647 || TREE_CODE (basesi->length) != INTEGER_CST
648 || compare_tree_int (basesi->length, off) == -1
649 || !tree_fits_shwi_p (basesi->length))
650 return 0;
652 HOST_WIDE_INT len = tree_to_shwi (basesi->length) - off;
653 strinfo *si = basesi, *chainsi;
654 if (si->first || si->prev || si->next)
655 si = verify_related_strinfos (basesi);
656 if (si == NULL
657 || si->length == NULL_TREE
658 || TREE_CODE (si->length) != INTEGER_CST)
659 return 0;
661 if (TREE_CODE (ptr) == SSA_NAME
662 && ssa_ver_to_stridx.length () <= SSA_NAME_VERSION (ptr))
663 ssa_ver_to_stridx.safe_grow_cleared (num_ssa_names);
665 gcc_checking_assert (compare_tree_int (si->length, off) != -1);
666 for (chainsi = si; chainsi->next; chainsi = si)
668 si = get_strinfo (chainsi->next);
669 if (si == NULL
670 || si->first != chainsi->first
671 || si->prev != chainsi->idx
672 || si->length == NULL_TREE
673 || TREE_CODE (si->length) != INTEGER_CST)
674 break;
675 int r = compare_tree_int (si->length, len);
676 if (r != 1)
678 if (r == 0)
680 if (TREE_CODE (ptr) == SSA_NAME)
681 ssa_ver_to_stridx[SSA_NAME_VERSION (ptr)] = si->idx;
682 else
684 int *pidx = addr_stridxptr (TREE_OPERAND (ptr, 0));
685 if (pidx != NULL && *pidx == 0)
686 *pidx = si->idx;
688 return si->idx;
690 break;
694 int idx = new_stridx (ptr);
695 if (idx == 0)
696 return 0;
697 si = new_strinfo (ptr, idx, build_int_cst (size_type_node, len));
698 set_strinfo (idx, si);
699 if (chainsi->next)
701 strinfo *nextsi = unshare_strinfo (get_strinfo (chainsi->next));
702 si->next = nextsi->idx;
703 nextsi->prev = idx;
705 chainsi = unshare_strinfo (chainsi);
706 if (chainsi->first == 0)
707 chainsi->first = chainsi->idx;
708 chainsi->next = idx;
709 if (chainsi->endptr == NULL_TREE && len == 0)
710 chainsi->endptr = ptr;
711 si->endptr = chainsi->endptr;
712 si->prev = chainsi->idx;
713 si->first = chainsi->first;
714 si->writable = chainsi->writable;
715 return si->idx;
718 /* Note that PTR, a pointer SSA_NAME initialized in the current stmt, points
719 to a zero-length string and if possible chain it to a related strinfo
720 chain whose part is or might be CHAINSI. */
722 static strinfo *
723 zero_length_string (tree ptr, strinfo *chainsi)
725 strinfo *si;
726 int idx;
727 if (ssa_ver_to_stridx.length () <= SSA_NAME_VERSION (ptr))
728 ssa_ver_to_stridx.safe_grow_cleared (num_ssa_names);
729 gcc_checking_assert (TREE_CODE (ptr) == SSA_NAME
730 && ssa_ver_to_stridx[SSA_NAME_VERSION (ptr)] == 0);
732 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (ptr))
733 return NULL;
734 if (chainsi != NULL)
736 si = verify_related_strinfos (chainsi);
737 if (si)
739 chainsi = si;
740 for (; chainsi->next; chainsi = si)
742 if (chainsi->endptr == NULL_TREE)
744 chainsi = unshare_strinfo (chainsi);
745 chainsi->endptr = ptr;
747 si = get_strinfo (chainsi->next);
748 if (si == NULL
749 || si->first != chainsi->first
750 || si->prev != chainsi->idx)
751 break;
753 gcc_assert (chainsi->length || chainsi->stmt);
754 if (chainsi->endptr == NULL_TREE)
756 chainsi = unshare_strinfo (chainsi);
757 chainsi->endptr = ptr;
759 if (chainsi->length && integer_zerop (chainsi->length))
761 if (chainsi->next)
763 chainsi = unshare_strinfo (chainsi);
764 chainsi->next = 0;
766 ssa_ver_to_stridx[SSA_NAME_VERSION (ptr)] = chainsi->idx;
767 return chainsi;
770 else if (chainsi->first || chainsi->prev || chainsi->next)
772 chainsi = unshare_strinfo (chainsi);
773 chainsi->first = 0;
774 chainsi->prev = 0;
775 chainsi->next = 0;
778 idx = new_stridx (ptr);
779 if (idx == 0)
780 return NULL;
781 si = new_strinfo (ptr, idx, build_int_cst (size_type_node, 0));
782 set_strinfo (idx, si);
783 si->endptr = ptr;
784 if (chainsi != NULL)
786 chainsi = unshare_strinfo (chainsi);
787 if (chainsi->first == 0)
788 chainsi->first = chainsi->idx;
789 chainsi->next = idx;
790 if (chainsi->endptr == NULL_TREE)
791 chainsi->endptr = ptr;
792 si->prev = chainsi->idx;
793 si->first = chainsi->first;
794 si->writable = chainsi->writable;
796 return si;
799 /* For strinfo ORIGSI whose length has been just updated
800 update also related strinfo lengths (add ADJ to each,
801 but don't adjust ORIGSI). */
803 static void
804 adjust_related_strinfos (location_t loc, strinfo *origsi, tree adj)
806 strinfo *si = verify_related_strinfos (origsi);
808 if (si == NULL)
809 return;
811 while (1)
813 strinfo *nsi;
815 if (si != origsi)
817 tree tem;
819 si = unshare_strinfo (si);
820 if (si->length)
822 tem = fold_convert_loc (loc, TREE_TYPE (si->length), adj);
823 si->length = fold_build2_loc (loc, PLUS_EXPR,
824 TREE_TYPE (si->length), si->length,
825 tem);
827 else if (si->stmt != NULL)
828 /* Delayed length computation is unaffected. */
830 else
831 gcc_unreachable ();
833 si->endptr = NULL_TREE;
834 si->dont_invalidate = true;
836 if (si->next == 0)
837 return;
838 nsi = get_strinfo (si->next);
839 if (nsi == NULL
840 || nsi->first != si->first
841 || nsi->prev != si->idx)
842 return;
843 si = nsi;
847 /* Find if there are other SSA_NAME pointers equal to PTR
848 for which we don't track their string lengths yet. If so, use
849 IDX for them. */
851 static void
852 find_equal_ptrs (tree ptr, int idx)
854 if (TREE_CODE (ptr) != SSA_NAME)
855 return;
856 while (1)
858 gimple *stmt = SSA_NAME_DEF_STMT (ptr);
859 if (!is_gimple_assign (stmt))
860 return;
861 ptr = gimple_assign_rhs1 (stmt);
862 switch (gimple_assign_rhs_code (stmt))
864 case SSA_NAME:
865 break;
866 CASE_CONVERT:
867 if (!POINTER_TYPE_P (TREE_TYPE (ptr)))
868 return;
869 if (TREE_CODE (ptr) == SSA_NAME)
870 break;
871 if (TREE_CODE (ptr) != ADDR_EXPR)
872 return;
873 /* FALLTHRU */
874 case ADDR_EXPR:
876 int *pidx = addr_stridxptr (TREE_OPERAND (ptr, 0));
877 if (pidx != NULL && *pidx == 0)
878 *pidx = idx;
879 return;
881 default:
882 return;
885 /* We might find an endptr created in this pass. Grow the
886 vector in that case. */
887 if (ssa_ver_to_stridx.length () <= SSA_NAME_VERSION (ptr))
888 ssa_ver_to_stridx.safe_grow_cleared (num_ssa_names);
890 if (ssa_ver_to_stridx[SSA_NAME_VERSION (ptr)] != 0)
891 return;
892 ssa_ver_to_stridx[SSA_NAME_VERSION (ptr)] = idx;
896 /* Return true if STMT is a call to a builtin function with the right
897 arguments and attributes that should be considered for optimization
898 by this pass. */
900 static bool
901 valid_builtin_call (gimple *stmt)
903 if (!gimple_call_builtin_p (stmt, BUILT_IN_NORMAL))
904 return false;
906 tree callee = gimple_call_fndecl (stmt);
907 switch (DECL_FUNCTION_CODE (callee))
909 case BUILT_IN_MEMCMP:
910 case BUILT_IN_MEMCMP_EQ:
911 case BUILT_IN_STRCHR:
912 case BUILT_IN_STRCHR_CHKP:
913 case BUILT_IN_STRLEN:
914 case BUILT_IN_STRLEN_CHKP:
915 /* The above functions should be pure. Punt if they aren't. */
916 if (gimple_vdef (stmt) || gimple_vuse (stmt) == NULL_TREE)
917 return false;
918 break;
920 case BUILT_IN_CALLOC:
921 case BUILT_IN_MALLOC:
922 case BUILT_IN_MEMCPY:
923 case BUILT_IN_MEMCPY_CHK:
924 case BUILT_IN_MEMCPY_CHKP:
925 case BUILT_IN_MEMCPY_CHK_CHKP:
926 case BUILT_IN_MEMPCPY:
927 case BUILT_IN_MEMPCPY_CHK:
928 case BUILT_IN_MEMPCPY_CHKP:
929 case BUILT_IN_MEMPCPY_CHK_CHKP:
930 case BUILT_IN_MEMSET:
931 case BUILT_IN_STPCPY:
932 case BUILT_IN_STPCPY_CHK:
933 case BUILT_IN_STPCPY_CHKP:
934 case BUILT_IN_STPCPY_CHK_CHKP:
935 case BUILT_IN_STRCAT:
936 case BUILT_IN_STRCAT_CHK:
937 case BUILT_IN_STRCAT_CHKP:
938 case BUILT_IN_STRCAT_CHK_CHKP:
939 case BUILT_IN_STRCPY:
940 case BUILT_IN_STRCPY_CHK:
941 case BUILT_IN_STRCPY_CHKP:
942 case BUILT_IN_STRCPY_CHK_CHKP:
943 /* The above functions should be neither const nor pure. Punt if they
944 aren't. */
945 if (gimple_vdef (stmt) == NULL_TREE || gimple_vuse (stmt) == NULL_TREE)
946 return false;
947 break;
949 default:
950 break;
953 return true;
956 /* If the last .MEM setter statement before STMT is
957 memcpy (x, y, strlen (y) + 1), the only .MEM use of it is STMT
958 and STMT is known to overwrite x[strlen (x)], adjust the last memcpy to
959 just memcpy (x, y, strlen (y)). SI must be the zero length
960 strinfo. */
962 static void
963 adjust_last_stmt (strinfo *si, gimple *stmt, bool is_strcat)
965 tree vuse, callee, len;
966 struct laststmt_struct last = laststmt;
967 strinfo *lastsi, *firstsi;
968 unsigned len_arg_no = 2;
970 laststmt.stmt = NULL;
971 laststmt.len = NULL_TREE;
972 laststmt.stridx = 0;
974 if (last.stmt == NULL)
975 return;
977 vuse = gimple_vuse (stmt);
978 if (vuse == NULL_TREE
979 || SSA_NAME_DEF_STMT (vuse) != last.stmt
980 || !has_single_use (vuse))
981 return;
983 gcc_assert (last.stridx > 0);
984 lastsi = get_strinfo (last.stridx);
985 if (lastsi == NULL)
986 return;
988 if (lastsi != si)
990 if (lastsi->first == 0 || lastsi->first != si->first)
991 return;
993 firstsi = verify_related_strinfos (si);
994 if (firstsi == NULL)
995 return;
996 while (firstsi != lastsi)
998 strinfo *nextsi;
999 if (firstsi->next == 0)
1000 return;
1001 nextsi = get_strinfo (firstsi->next);
1002 if (nextsi == NULL
1003 || nextsi->prev != firstsi->idx
1004 || nextsi->first != si->first)
1005 return;
1006 firstsi = nextsi;
1010 if (!is_strcat)
1012 if (si->length == NULL_TREE || !integer_zerop (si->length))
1013 return;
1016 if (is_gimple_assign (last.stmt))
1018 gimple_stmt_iterator gsi;
1020 if (!integer_zerop (gimple_assign_rhs1 (last.stmt)))
1021 return;
1022 if (stmt_could_throw_p (last.stmt))
1023 return;
1024 gsi = gsi_for_stmt (last.stmt);
1025 unlink_stmt_vdef (last.stmt);
1026 release_defs (last.stmt);
1027 gsi_remove (&gsi, true);
1028 return;
1031 if (!valid_builtin_call (last.stmt))
1032 return;
1034 callee = gimple_call_fndecl (last.stmt);
1035 switch (DECL_FUNCTION_CODE (callee))
1037 case BUILT_IN_MEMCPY:
1038 case BUILT_IN_MEMCPY_CHK:
1039 break;
1040 case BUILT_IN_MEMCPY_CHKP:
1041 case BUILT_IN_MEMCPY_CHK_CHKP:
1042 len_arg_no = 4;
1043 break;
1044 default:
1045 return;
1048 len = gimple_call_arg (last.stmt, len_arg_no);
1049 if (tree_fits_uhwi_p (len))
1051 if (!tree_fits_uhwi_p (last.len)
1052 || integer_zerop (len)
1053 || tree_to_uhwi (len) != tree_to_uhwi (last.len) + 1)
1054 return;
1055 /* Don't adjust the length if it is divisible by 4, it is more efficient
1056 to store the extra '\0' in that case. */
1057 if ((tree_to_uhwi (len) & 3) == 0)
1058 return;
1060 else if (TREE_CODE (len) == SSA_NAME)
1062 gimple *def_stmt = SSA_NAME_DEF_STMT (len);
1063 if (!is_gimple_assign (def_stmt)
1064 || gimple_assign_rhs_code (def_stmt) != PLUS_EXPR
1065 || gimple_assign_rhs1 (def_stmt) != last.len
1066 || !integer_onep (gimple_assign_rhs2 (def_stmt)))
1067 return;
1069 else
1070 return;
1072 gimple_call_set_arg (last.stmt, len_arg_no, last.len);
1073 update_stmt (last.stmt);
1076 /* Handle a strlen call. If strlen of the argument is known, replace
1077 the strlen call with the known value, otherwise remember that strlen
1078 of the argument is stored in the lhs SSA_NAME. */
1080 static void
1081 handle_builtin_strlen (gimple_stmt_iterator *gsi)
1083 int idx;
1084 tree src;
1085 gimple *stmt = gsi_stmt (*gsi);
1086 tree lhs = gimple_call_lhs (stmt);
1088 if (lhs == NULL_TREE)
1089 return;
1091 src = gimple_call_arg (stmt, 0);
1092 idx = get_stridx (src);
1093 if (idx)
1095 strinfo *si = NULL;
1096 tree rhs;
1098 if (idx < 0)
1099 rhs = build_int_cst (TREE_TYPE (lhs), ~idx);
1100 else
1102 rhs = NULL_TREE;
1103 si = get_strinfo (idx);
1104 if (si != NULL)
1105 rhs = get_string_length (si);
1107 if (rhs != NULL_TREE)
1109 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1111 fprintf (dump_file, "Optimizing: ");
1112 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1114 rhs = unshare_expr (rhs);
1115 if (!useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (rhs)))
1116 rhs = fold_convert_loc (gimple_location (stmt),
1117 TREE_TYPE (lhs), rhs);
1118 if (!update_call_from_tree (gsi, rhs))
1119 gimplify_and_update_call_from_tree (gsi, rhs);
1120 stmt = gsi_stmt (*gsi);
1121 update_stmt (stmt);
1122 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1124 fprintf (dump_file, "into: ");
1125 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1127 if (si != NULL
1128 && TREE_CODE (si->length) != SSA_NAME
1129 && TREE_CODE (si->length) != INTEGER_CST
1130 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs))
1132 si = unshare_strinfo (si);
1133 si->length = lhs;
1135 return;
1138 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs))
1139 return;
1140 if (idx == 0)
1141 idx = new_stridx (src);
1142 else if (get_strinfo (idx) != NULL)
1143 return;
1144 if (idx)
1146 strinfo *si = new_strinfo (src, idx, lhs);
1147 set_strinfo (idx, si);
1148 find_equal_ptrs (src, idx);
1152 /* Handle a strchr call. If strlen of the first argument is known, replace
1153 the strchr (x, 0) call with the endptr or x + strlen, otherwise remember
1154 that lhs of the call is endptr and strlen of the argument is endptr - x. */
1156 static void
1157 handle_builtin_strchr (gimple_stmt_iterator *gsi)
1159 int idx;
1160 tree src;
1161 gimple *stmt = gsi_stmt (*gsi);
1162 tree lhs = gimple_call_lhs (stmt);
1163 bool with_bounds = gimple_call_with_bounds_p (stmt);
1165 if (lhs == NULL_TREE)
1166 return;
1168 if (!integer_zerop (gimple_call_arg (stmt, with_bounds ? 2 : 1)))
1169 return;
1171 src = gimple_call_arg (stmt, 0);
1172 idx = get_stridx (src);
1173 if (idx)
1175 strinfo *si = NULL;
1176 tree rhs;
1178 if (idx < 0)
1179 rhs = build_int_cst (size_type_node, ~idx);
1180 else
1182 rhs = NULL_TREE;
1183 si = get_strinfo (idx);
1184 if (si != NULL)
1185 rhs = get_string_length (si);
1187 if (rhs != NULL_TREE)
1189 location_t loc = gimple_location (stmt);
1191 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1193 fprintf (dump_file, "Optimizing: ");
1194 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1196 if (si != NULL && si->endptr != NULL_TREE)
1198 rhs = unshare_expr (si->endptr);
1199 if (!useless_type_conversion_p (TREE_TYPE (lhs),
1200 TREE_TYPE (rhs)))
1201 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
1203 else
1205 rhs = fold_convert_loc (loc, sizetype, unshare_expr (rhs));
1206 rhs = fold_build2_loc (loc, POINTER_PLUS_EXPR,
1207 TREE_TYPE (src), src, rhs);
1208 if (!useless_type_conversion_p (TREE_TYPE (lhs),
1209 TREE_TYPE (rhs)))
1210 rhs = fold_convert_loc (loc, TREE_TYPE (lhs), rhs);
1212 if (!update_call_from_tree (gsi, rhs))
1213 gimplify_and_update_call_from_tree (gsi, rhs);
1214 stmt = gsi_stmt (*gsi);
1215 update_stmt (stmt);
1216 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1218 fprintf (dump_file, "into: ");
1219 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1221 if (si != NULL
1222 && si->endptr == NULL_TREE
1223 && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs))
1225 si = unshare_strinfo (si);
1226 si->endptr = lhs;
1228 zero_length_string (lhs, si);
1229 return;
1232 if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (lhs))
1233 return;
1234 if (TREE_CODE (src) != SSA_NAME || !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (src))
1236 if (idx == 0)
1237 idx = new_stridx (src);
1238 else if (get_strinfo (idx) != NULL)
1240 zero_length_string (lhs, NULL);
1241 return;
1243 if (idx)
1245 location_t loc = gimple_location (stmt);
1246 tree lhsu = fold_convert_loc (loc, size_type_node, lhs);
1247 tree srcu = fold_convert_loc (loc, size_type_node, src);
1248 tree length = fold_build2_loc (loc, MINUS_EXPR,
1249 size_type_node, lhsu, srcu);
1250 strinfo *si = new_strinfo (src, idx, length);
1251 si->endptr = lhs;
1252 set_strinfo (idx, si);
1253 find_equal_ptrs (src, idx);
1254 zero_length_string (lhs, si);
1257 else
1258 zero_length_string (lhs, NULL);
1261 /* Handle a strcpy-like ({st{r,p}cpy,__st{r,p}cpy_chk}) call.
1262 If strlen of the second argument is known, strlen of the first argument
1263 is the same after this call. Furthermore, attempt to convert it to
1264 memcpy. */
1266 static void
1267 handle_builtin_strcpy (enum built_in_function bcode, gimple_stmt_iterator *gsi)
1269 int idx, didx;
1270 tree src, dst, srclen, len, lhs, args, type, fn, oldlen;
1271 bool success;
1272 gimple *stmt = gsi_stmt (*gsi);
1273 strinfo *si, *dsi, *olddsi, *zsi;
1274 location_t loc;
1275 bool with_bounds = gimple_call_with_bounds_p (stmt);
1277 src = gimple_call_arg (stmt, with_bounds ? 2 : 1);
1278 dst = gimple_call_arg (stmt, 0);
1279 lhs = gimple_call_lhs (stmt);
1280 idx = get_stridx (src);
1281 si = NULL;
1282 if (idx > 0)
1283 si = get_strinfo (idx);
1285 didx = get_stridx (dst);
1286 olddsi = NULL;
1287 oldlen = NULL_TREE;
1288 if (didx > 0)
1289 olddsi = get_strinfo (didx);
1290 else if (didx < 0)
1291 return;
1293 if (olddsi != NULL)
1294 adjust_last_stmt (olddsi, stmt, false);
1296 srclen = NULL_TREE;
1297 if (si != NULL)
1298 srclen = get_string_length (si);
1299 else if (idx < 0)
1300 srclen = build_int_cst (size_type_node, ~idx);
1302 loc = gimple_location (stmt);
1303 if (srclen == NULL_TREE)
1304 switch (bcode)
1306 case BUILT_IN_STRCPY:
1307 case BUILT_IN_STRCPY_CHK:
1308 case BUILT_IN_STRCPY_CHKP:
1309 case BUILT_IN_STRCPY_CHK_CHKP:
1310 if (lhs != NULL_TREE || !builtin_decl_implicit_p (BUILT_IN_STPCPY))
1311 return;
1312 break;
1313 case BUILT_IN_STPCPY:
1314 case BUILT_IN_STPCPY_CHK:
1315 case BUILT_IN_STPCPY_CHKP:
1316 case BUILT_IN_STPCPY_CHK_CHKP:
1317 if (lhs == NULL_TREE)
1318 return;
1319 else
1321 tree lhsuint = fold_convert_loc (loc, size_type_node, lhs);
1322 srclen = fold_convert_loc (loc, size_type_node, dst);
1323 srclen = fold_build2_loc (loc, MINUS_EXPR, size_type_node,
1324 lhsuint, srclen);
1326 break;
1327 default:
1328 gcc_unreachable ();
1331 if (didx == 0)
1333 didx = new_stridx (dst);
1334 if (didx == 0)
1335 return;
1337 if (olddsi != NULL)
1339 oldlen = olddsi->length;
1340 dsi = unshare_strinfo (olddsi);
1341 dsi->length = srclen;
1342 /* Break the chain, so adjust_related_strinfo on later pointers in
1343 the chain won't adjust this one anymore. */
1344 dsi->next = 0;
1345 dsi->stmt = NULL;
1346 dsi->endptr = NULL_TREE;
1348 else
1350 dsi = new_strinfo (dst, didx, srclen);
1351 set_strinfo (didx, dsi);
1352 find_equal_ptrs (dst, didx);
1354 dsi->writable = true;
1355 dsi->dont_invalidate = true;
1357 if (dsi->length == NULL_TREE)
1359 strinfo *chainsi;
1361 /* If string length of src is unknown, use delayed length
1362 computation. If string lenth of dst will be needed, it
1363 can be computed by transforming this strcpy call into
1364 stpcpy and subtracting dst from the return value. */
1366 /* Look for earlier strings whose length could be determined if
1367 this strcpy is turned into an stpcpy. */
1369 if (dsi->prev != 0 && (chainsi = verify_related_strinfos (dsi)) != NULL)
1371 for (; chainsi && chainsi != dsi; chainsi = get_strinfo (chainsi->next))
1373 /* When setting a stmt for delayed length computation
1374 prevent all strinfos through dsi from being
1375 invalidated. */
1376 chainsi = unshare_strinfo (chainsi);
1377 chainsi->stmt = stmt;
1378 chainsi->length = NULL_TREE;
1379 chainsi->endptr = NULL_TREE;
1380 chainsi->dont_invalidate = true;
1383 dsi->stmt = stmt;
1384 return;
1387 if (olddsi != NULL)
1389 tree adj = NULL_TREE;
1390 if (oldlen == NULL_TREE)
1392 else if (integer_zerop (oldlen))
1393 adj = srclen;
1394 else if (TREE_CODE (oldlen) == INTEGER_CST
1395 || TREE_CODE (srclen) == INTEGER_CST)
1396 adj = fold_build2_loc (loc, MINUS_EXPR,
1397 TREE_TYPE (srclen), srclen,
1398 fold_convert_loc (loc, TREE_TYPE (srclen),
1399 oldlen));
1400 if (adj != NULL_TREE)
1401 adjust_related_strinfos (loc, dsi, adj);
1402 else
1403 dsi->prev = 0;
1405 /* strcpy src may not overlap dst, so src doesn't need to be
1406 invalidated either. */
1407 if (si != NULL)
1408 si->dont_invalidate = true;
1410 fn = NULL_TREE;
1411 zsi = NULL;
1412 switch (bcode)
1414 case BUILT_IN_STRCPY:
1415 case BUILT_IN_STRCPY_CHKP:
1416 fn = builtin_decl_implicit (BUILT_IN_MEMCPY);
1417 if (lhs)
1418 ssa_ver_to_stridx[SSA_NAME_VERSION (lhs)] = didx;
1419 break;
1420 case BUILT_IN_STRCPY_CHK:
1421 case BUILT_IN_STRCPY_CHK_CHKP:
1422 fn = builtin_decl_explicit (BUILT_IN_MEMCPY_CHK);
1423 if (lhs)
1424 ssa_ver_to_stridx[SSA_NAME_VERSION (lhs)] = didx;
1425 break;
1426 case BUILT_IN_STPCPY:
1427 case BUILT_IN_STPCPY_CHKP:
1428 /* This would need adjustment of the lhs (subtract one),
1429 or detection that the trailing '\0' doesn't need to be
1430 written, if it will be immediately overwritten.
1431 fn = builtin_decl_explicit (BUILT_IN_MEMPCPY); */
1432 if (lhs)
1434 dsi->endptr = lhs;
1435 zsi = zero_length_string (lhs, dsi);
1437 break;
1438 case BUILT_IN_STPCPY_CHK:
1439 case BUILT_IN_STPCPY_CHK_CHKP:
1440 /* This would need adjustment of the lhs (subtract one),
1441 or detection that the trailing '\0' doesn't need to be
1442 written, if it will be immediately overwritten.
1443 fn = builtin_decl_explicit (BUILT_IN_MEMPCPY_CHK); */
1444 if (lhs)
1446 dsi->endptr = lhs;
1447 zsi = zero_length_string (lhs, dsi);
1449 break;
1450 default:
1451 gcc_unreachable ();
1453 if (zsi != NULL)
1454 zsi->dont_invalidate = true;
1456 if (fn == NULL_TREE)
1457 return;
1459 args = TYPE_ARG_TYPES (TREE_TYPE (fn));
1460 type = TREE_VALUE (TREE_CHAIN (TREE_CHAIN (args)));
1462 len = fold_convert_loc (loc, type, unshare_expr (srclen));
1463 len = fold_build2_loc (loc, PLUS_EXPR, type, len, build_int_cst (type, 1));
1464 len = force_gimple_operand_gsi (gsi, len, true, NULL_TREE, true,
1465 GSI_SAME_STMT);
1466 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1468 fprintf (dump_file, "Optimizing: ");
1469 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1471 if (with_bounds)
1473 fn = chkp_maybe_create_clone (fn)->decl;
1474 if (gimple_call_num_args (stmt) == 4)
1475 success = update_gimple_call (gsi, fn, 5, dst,
1476 gimple_call_arg (stmt, 1),
1477 src,
1478 gimple_call_arg (stmt, 3),
1479 len);
1480 else
1481 success = update_gimple_call (gsi, fn, 6, dst,
1482 gimple_call_arg (stmt, 1),
1483 src,
1484 gimple_call_arg (stmt, 3),
1485 len,
1486 gimple_call_arg (stmt, 4));
1488 else
1489 if (gimple_call_num_args (stmt) == 2)
1490 success = update_gimple_call (gsi, fn, 3, dst, src, len);
1491 else
1492 success = update_gimple_call (gsi, fn, 4, dst, src, len,
1493 gimple_call_arg (stmt, 2));
1494 if (success)
1496 stmt = gsi_stmt (*gsi);
1497 gimple_call_set_with_bounds (stmt, with_bounds);
1498 update_stmt (stmt);
1499 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1501 fprintf (dump_file, "into: ");
1502 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1504 /* Allow adjust_last_stmt to decrease this memcpy's size. */
1505 laststmt.stmt = stmt;
1506 laststmt.len = srclen;
1507 laststmt.stridx = dsi->idx;
1509 else if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1510 fprintf (dump_file, "not possible.\n");
1513 /* Handle a memcpy-like ({mem{,p}cpy,__mem{,p}cpy_chk}) call.
1514 If strlen of the second argument is known and length of the third argument
1515 is that plus one, strlen of the first argument is the same after this
1516 call. */
1518 static void
1519 handle_builtin_memcpy (enum built_in_function bcode, gimple_stmt_iterator *gsi)
1521 int idx, didx;
1522 tree src, dst, len, lhs, oldlen, newlen;
1523 gimple *stmt = gsi_stmt (*gsi);
1524 strinfo *si, *dsi, *olddsi;
1525 bool with_bounds = gimple_call_with_bounds_p (stmt);
1527 len = gimple_call_arg (stmt, with_bounds ? 4 : 2);
1528 src = gimple_call_arg (stmt, with_bounds ? 2 : 1);
1529 dst = gimple_call_arg (stmt, 0);
1530 idx = get_stridx (src);
1531 if (idx == 0)
1532 return;
1534 didx = get_stridx (dst);
1535 olddsi = NULL;
1536 if (didx > 0)
1537 olddsi = get_strinfo (didx);
1538 else if (didx < 0)
1539 return;
1541 if (olddsi != NULL
1542 && tree_fits_uhwi_p (len)
1543 && !integer_zerop (len))
1544 adjust_last_stmt (olddsi, stmt, false);
1546 if (idx > 0)
1548 gimple *def_stmt;
1550 /* Handle memcpy (x, y, l) where l is strlen (y) + 1. */
1551 si = get_strinfo (idx);
1552 if (si == NULL || si->length == NULL_TREE)
1553 return;
1554 if (TREE_CODE (len) != SSA_NAME)
1555 return;
1556 def_stmt = SSA_NAME_DEF_STMT (len);
1557 if (!is_gimple_assign (def_stmt)
1558 || gimple_assign_rhs_code (def_stmt) != PLUS_EXPR
1559 || gimple_assign_rhs1 (def_stmt) != si->length
1560 || !integer_onep (gimple_assign_rhs2 (def_stmt)))
1561 return;
1563 else
1565 si = NULL;
1566 /* Handle memcpy (x, "abcd", 5) or
1567 memcpy (x, "abc\0uvw", 7). */
1568 if (!tree_fits_uhwi_p (len)
1569 || tree_to_uhwi (len) <= (unsigned HOST_WIDE_INT) ~idx)
1570 return;
1573 if (olddsi != NULL && TREE_CODE (len) == SSA_NAME)
1574 adjust_last_stmt (olddsi, stmt, false);
1576 if (didx == 0)
1578 didx = new_stridx (dst);
1579 if (didx == 0)
1580 return;
1582 if (si != NULL)
1583 newlen = si->length;
1584 else
1585 newlen = build_int_cst (size_type_node, ~idx);
1586 oldlen = NULL_TREE;
1587 if (olddsi != NULL)
1589 dsi = unshare_strinfo (olddsi);
1590 oldlen = olddsi->length;
1591 dsi->length = newlen;
1592 /* Break the chain, so adjust_related_strinfo on later pointers in
1593 the chain won't adjust this one anymore. */
1594 dsi->next = 0;
1595 dsi->stmt = NULL;
1596 dsi->endptr = NULL_TREE;
1598 else
1600 dsi = new_strinfo (dst, didx, newlen);
1601 set_strinfo (didx, dsi);
1602 find_equal_ptrs (dst, didx);
1604 dsi->writable = true;
1605 dsi->dont_invalidate = true;
1606 if (olddsi != NULL)
1608 tree adj = NULL_TREE;
1609 location_t loc = gimple_location (stmt);
1610 if (oldlen == NULL_TREE)
1612 else if (integer_zerop (oldlen))
1613 adj = dsi->length;
1614 else if (TREE_CODE (oldlen) == INTEGER_CST
1615 || TREE_CODE (dsi->length) == INTEGER_CST)
1616 adj = fold_build2_loc (loc, MINUS_EXPR,
1617 TREE_TYPE (dsi->length), dsi->length,
1618 fold_convert_loc (loc, TREE_TYPE (dsi->length),
1619 oldlen));
1620 if (adj != NULL_TREE)
1621 adjust_related_strinfos (loc, dsi, adj);
1622 else
1623 dsi->prev = 0;
1625 /* memcpy src may not overlap dst, so src doesn't need to be
1626 invalidated either. */
1627 if (si != NULL)
1628 si->dont_invalidate = true;
1630 lhs = gimple_call_lhs (stmt);
1631 switch (bcode)
1633 case BUILT_IN_MEMCPY:
1634 case BUILT_IN_MEMCPY_CHK:
1635 case BUILT_IN_MEMCPY_CHKP:
1636 case BUILT_IN_MEMCPY_CHK_CHKP:
1637 /* Allow adjust_last_stmt to decrease this memcpy's size. */
1638 laststmt.stmt = stmt;
1639 laststmt.len = dsi->length;
1640 laststmt.stridx = dsi->idx;
1641 if (lhs)
1642 ssa_ver_to_stridx[SSA_NAME_VERSION (lhs)] = didx;
1643 break;
1644 case BUILT_IN_MEMPCPY:
1645 case BUILT_IN_MEMPCPY_CHK:
1646 case BUILT_IN_MEMPCPY_CHKP:
1647 case BUILT_IN_MEMPCPY_CHK_CHKP:
1648 break;
1649 default:
1650 gcc_unreachable ();
1654 /* Handle a strcat-like ({strcat,__strcat_chk}) call.
1655 If strlen of the second argument is known, strlen of the first argument
1656 is increased by the length of the second argument. Furthermore, attempt
1657 to convert it to memcpy/strcpy if the length of the first argument
1658 is known. */
1660 static void
1661 handle_builtin_strcat (enum built_in_function bcode, gimple_stmt_iterator *gsi)
1663 int idx, didx;
1664 tree src, dst, srclen, dstlen, len, lhs, args, type, fn, objsz, endptr;
1665 bool success;
1666 gimple *stmt = gsi_stmt (*gsi);
1667 strinfo *si, *dsi;
1668 location_t loc;
1669 bool with_bounds = gimple_call_with_bounds_p (stmt);
1671 src = gimple_call_arg (stmt, with_bounds ? 2 : 1);
1672 dst = gimple_call_arg (stmt, 0);
1673 lhs = gimple_call_lhs (stmt);
1675 didx = get_stridx (dst);
1676 if (didx < 0)
1677 return;
1679 dsi = NULL;
1680 if (didx > 0)
1681 dsi = get_strinfo (didx);
1682 if (dsi == NULL || get_string_length (dsi) == NULL_TREE)
1684 /* strcat (p, q) can be transformed into
1685 tmp = p + strlen (p); endptr = strpcpy (tmp, q);
1686 with length endptr - p if we need to compute the length
1687 later on. Don't do this transformation if we don't need
1688 it. */
1689 if (builtin_decl_implicit_p (BUILT_IN_STPCPY) && lhs == NULL_TREE)
1691 if (didx == 0)
1693 didx = new_stridx (dst);
1694 if (didx == 0)
1695 return;
1697 if (dsi == NULL)
1699 dsi = new_strinfo (dst, didx, NULL_TREE);
1700 set_strinfo (didx, dsi);
1701 find_equal_ptrs (dst, didx);
1703 else
1705 dsi = unshare_strinfo (dsi);
1706 dsi->length = NULL_TREE;
1707 dsi->next = 0;
1708 dsi->endptr = NULL_TREE;
1710 dsi->writable = true;
1711 dsi->stmt = stmt;
1712 dsi->dont_invalidate = true;
1714 return;
1717 srclen = NULL_TREE;
1718 si = NULL;
1719 idx = get_stridx (src);
1720 if (idx < 0)
1721 srclen = build_int_cst (size_type_node, ~idx);
1722 else if (idx > 0)
1724 si = get_strinfo (idx);
1725 if (si != NULL)
1726 srclen = get_string_length (si);
1729 loc = gimple_location (stmt);
1730 dstlen = dsi->length;
1731 endptr = dsi->endptr;
1733 dsi = unshare_strinfo (dsi);
1734 dsi->endptr = NULL_TREE;
1735 dsi->stmt = NULL;
1736 dsi->writable = true;
1738 if (srclen != NULL_TREE)
1740 dsi->length = fold_build2_loc (loc, PLUS_EXPR, TREE_TYPE (dsi->length),
1741 dsi->length, srclen);
1742 adjust_related_strinfos (loc, dsi, srclen);
1743 dsi->dont_invalidate = true;
1745 else
1747 dsi->length = NULL;
1748 if (lhs == NULL_TREE && builtin_decl_implicit_p (BUILT_IN_STPCPY))
1749 dsi->dont_invalidate = true;
1752 if (si != NULL)
1753 /* strcat src may not overlap dst, so src doesn't need to be
1754 invalidated either. */
1755 si->dont_invalidate = true;
1757 /* For now. Could remove the lhs from the call and add
1758 lhs = dst; afterwards. */
1759 if (lhs)
1760 return;
1762 fn = NULL_TREE;
1763 objsz = NULL_TREE;
1764 switch (bcode)
1766 case BUILT_IN_STRCAT:
1767 case BUILT_IN_STRCAT_CHKP:
1768 if (srclen != NULL_TREE)
1769 fn = builtin_decl_implicit (BUILT_IN_MEMCPY);
1770 else
1771 fn = builtin_decl_implicit (BUILT_IN_STRCPY);
1772 break;
1773 case BUILT_IN_STRCAT_CHK:
1774 case BUILT_IN_STRCAT_CHK_CHKP:
1775 if (srclen != NULL_TREE)
1776 fn = builtin_decl_explicit (BUILT_IN_MEMCPY_CHK);
1777 else
1778 fn = builtin_decl_explicit (BUILT_IN_STRCPY_CHK);
1779 objsz = gimple_call_arg (stmt, with_bounds ? 4 : 2);
1780 break;
1781 default:
1782 gcc_unreachable ();
1785 if (fn == NULL_TREE)
1786 return;
1788 len = NULL_TREE;
1789 if (srclen != NULL_TREE)
1791 args = TYPE_ARG_TYPES (TREE_TYPE (fn));
1792 type = TREE_VALUE (TREE_CHAIN (TREE_CHAIN (args)));
1794 len = fold_convert_loc (loc, type, unshare_expr (srclen));
1795 len = fold_build2_loc (loc, PLUS_EXPR, type, len,
1796 build_int_cst (type, 1));
1797 len = force_gimple_operand_gsi (gsi, len, true, NULL_TREE, true,
1798 GSI_SAME_STMT);
1800 if (endptr)
1801 dst = fold_convert_loc (loc, TREE_TYPE (dst), unshare_expr (endptr));
1802 else
1803 dst = fold_build2_loc (loc, POINTER_PLUS_EXPR,
1804 TREE_TYPE (dst), unshare_expr (dst),
1805 fold_convert_loc (loc, sizetype,
1806 unshare_expr (dstlen)));
1807 dst = force_gimple_operand_gsi (gsi, dst, true, NULL_TREE, true,
1808 GSI_SAME_STMT);
1809 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1811 fprintf (dump_file, "Optimizing: ");
1812 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1814 if (with_bounds)
1816 fn = chkp_maybe_create_clone (fn)->decl;
1817 if (srclen != NULL_TREE)
1818 success = update_gimple_call (gsi, fn, 5 + (objsz != NULL_TREE),
1819 dst,
1820 gimple_call_arg (stmt, 1),
1821 src,
1822 gimple_call_arg (stmt, 3),
1823 len, objsz);
1824 else
1825 success = update_gimple_call (gsi, fn, 4 + (objsz != NULL_TREE),
1826 dst,
1827 gimple_call_arg (stmt, 1),
1828 src,
1829 gimple_call_arg (stmt, 3),
1830 objsz);
1832 else
1833 if (srclen != NULL_TREE)
1834 success = update_gimple_call (gsi, fn, 3 + (objsz != NULL_TREE),
1835 dst, src, len, objsz);
1836 else
1837 success = update_gimple_call (gsi, fn, 2 + (objsz != NULL_TREE),
1838 dst, src, objsz);
1839 if (success)
1841 stmt = gsi_stmt (*gsi);
1842 gimple_call_set_with_bounds (stmt, with_bounds);
1843 update_stmt (stmt);
1844 if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1846 fprintf (dump_file, "into: ");
1847 print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1849 /* If srclen == NULL, note that current string length can be
1850 computed by transforming this strcpy into stpcpy. */
1851 if (srclen == NULL_TREE && dsi->dont_invalidate)
1852 dsi->stmt = stmt;
1853 adjust_last_stmt (dsi, stmt, true);
1854 if (srclen != NULL_TREE)
1856 laststmt.stmt = stmt;
1857 laststmt.len = srclen;
1858 laststmt.stridx = dsi->idx;
1861 else if (dump_file && (dump_flags & TDF_DETAILS) != 0)
1862 fprintf (dump_file, "not possible.\n");
1865 /* Handle a call to malloc or calloc. */
1867 static void
1868 handle_builtin_malloc (enum built_in_function bcode, gimple_stmt_iterator *gsi)
1870 gimple *stmt = gsi_stmt (*gsi);
1871 tree lhs = gimple_call_lhs (stmt);
1872 if (lhs == NULL_TREE)
1873 return;
1875 gcc_assert (get_stridx (lhs) == 0);
1876 int idx = new_stridx (lhs);
1877 tree length = NULL_TREE;
1878 if (bcode == BUILT_IN_CALLOC)
1879 length = build_int_cst (size_type_node, 0);
1880 strinfo *si = new_strinfo (lhs, idx, length);
1881 if (bcode == BUILT_IN_CALLOC)
1882 si->endptr = lhs;
1883 set_strinfo (idx, si);
1884 si->writable = true;
1885 si->stmt = stmt;
1886 si->dont_invalidate = true;
1889 /* Handle a call to memset.
1890 After a call to calloc, memset(,0,) is unnecessary.
1891 memset(malloc(n),0,n) is calloc(n,1). */
1893 static bool
1894 handle_builtin_memset (gimple_stmt_iterator *gsi)
1896 gimple *stmt2 = gsi_stmt (*gsi);
1897 if (!integer_zerop (gimple_call_arg (stmt2, 1)))
1898 return true;
1899 tree ptr = gimple_call_arg (stmt2, 0);
1900 int idx1 = get_stridx (ptr);
1901 if (idx1 <= 0)
1902 return true;
1903 strinfo *si1 = get_strinfo (idx1);
1904 if (!si1)
1905 return true;
1906 gimple *stmt1 = si1->stmt;
1907 if (!stmt1 || !is_gimple_call (stmt1))
1908 return true;
1909 tree callee1 = gimple_call_fndecl (stmt1);
1910 if (!valid_builtin_call (stmt1))
1911 return true;
1912 enum built_in_function code1 = DECL_FUNCTION_CODE (callee1);
1913 tree size = gimple_call_arg (stmt2, 2);
1914 if (code1 == BUILT_IN_CALLOC)
1915 /* Not touching stmt1 */ ;
1916 else if (code1 == BUILT_IN_MALLOC
1917 && operand_equal_p (gimple_call_arg (stmt1, 0), size, 0))
1919 gimple_stmt_iterator gsi1 = gsi_for_stmt (stmt1);
1920 update_gimple_call (&gsi1, builtin_decl_implicit (BUILT_IN_CALLOC), 2,
1921 size, build_one_cst (size_type_node));
1922 si1->length = build_int_cst (size_type_node, 0);
1923 si1->stmt = gsi_stmt (gsi1);
1925 else
1926 return true;
1927 tree lhs = gimple_call_lhs (stmt2);
1928 unlink_stmt_vdef (stmt2);
1929 if (lhs)
1931 gimple *assign = gimple_build_assign (lhs, ptr);
1932 gsi_replace (gsi, assign, false);
1934 else
1936 gsi_remove (gsi, true);
1937 release_defs (stmt2);
1940 return false;
1943 /* Handle a call to memcmp. We try to handle small comparisons by
1944 converting them to load and compare, and replacing the call to memcmp
1945 with a __builtin_memcmp_eq call where possible. */
1947 static bool
1948 handle_builtin_memcmp (gimple_stmt_iterator *gsi)
1950 gcall *stmt2 = as_a <gcall *> (gsi_stmt (*gsi));
1951 tree res = gimple_call_lhs (stmt2);
1952 tree arg1 = gimple_call_arg (stmt2, 0);
1953 tree arg2 = gimple_call_arg (stmt2, 1);
1954 tree len = gimple_call_arg (stmt2, 2);
1955 unsigned HOST_WIDE_INT leni;
1956 use_operand_p use_p;
1957 imm_use_iterator iter;
1959 if (!res)
1960 return true;
1962 FOR_EACH_IMM_USE_FAST (use_p, iter, res)
1964 gimple *ustmt = USE_STMT (use_p);
1966 if (is_gimple_debug (ustmt))
1967 continue;
1968 if (gimple_code (ustmt) == GIMPLE_ASSIGN)
1970 gassign *asgn = as_a <gassign *> (ustmt);
1971 tree_code code = gimple_assign_rhs_code (asgn);
1972 if ((code != EQ_EXPR && code != NE_EXPR)
1973 || !integer_zerop (gimple_assign_rhs2 (asgn)))
1974 return true;
1976 else if (gimple_code (ustmt) == GIMPLE_COND)
1978 tree_code code = gimple_cond_code (ustmt);
1979 if ((code != EQ_EXPR && code != NE_EXPR)
1980 || !integer_zerop (gimple_cond_rhs (ustmt)))
1981 return true;
1983 else
1984 return true;
1987 if (tree_fits_uhwi_p (len)
1988 && (leni = tree_to_uhwi (len)) <= GET_MODE_SIZE (word_mode)
1989 && pow2p_hwi (leni))
1991 leni *= CHAR_TYPE_SIZE;
1992 unsigned align1 = get_pointer_alignment (arg1);
1993 unsigned align2 = get_pointer_alignment (arg2);
1994 unsigned align = MIN (align1, align2);
1995 machine_mode mode = mode_for_size (leni, MODE_INT, 1);
1996 if (mode != BLKmode
1997 && (align >= leni || !SLOW_UNALIGNED_ACCESS (mode, align)))
1999 location_t loc = gimple_location (stmt2);
2000 tree type, off;
2001 type = build_nonstandard_integer_type (leni, 1);
2002 gcc_assert (GET_MODE_BITSIZE (TYPE_MODE (type)) == leni);
2003 tree ptrtype = build_pointer_type_for_mode (char_type_node,
2004 ptr_mode, true);
2005 off = build_int_cst (ptrtype, 0);
2006 arg1 = build2_loc (loc, MEM_REF, type, arg1, off);
2007 arg2 = build2_loc (loc, MEM_REF, type, arg2, off);
2008 tree tem1 = fold_const_aggregate_ref (arg1);
2009 if (tem1)
2010 arg1 = tem1;
2011 tree tem2 = fold_const_aggregate_ref (arg2);
2012 if (tem2)
2013 arg2 = tem2;
2014 res = fold_convert_loc (loc, TREE_TYPE (res),
2015 fold_build2_loc (loc, NE_EXPR,
2016 boolean_type_node,
2017 arg1, arg2));
2018 gimplify_and_update_call_from_tree (gsi, res);
2019 return false;
2023 gimple_call_set_fndecl (stmt2, builtin_decl_explicit (BUILT_IN_MEMCMP_EQ));
2024 return false;
2027 /* Handle a POINTER_PLUS_EXPR statement.
2028 For p = "abcd" + 2; compute associated length, or if
2029 p = q + off is pointing to a '\0' character of a string, call
2030 zero_length_string on it. */
2032 static void
2033 handle_pointer_plus (gimple_stmt_iterator *gsi)
2035 gimple *stmt = gsi_stmt (*gsi);
2036 tree lhs = gimple_assign_lhs (stmt), off;
2037 int idx = get_stridx (gimple_assign_rhs1 (stmt));
2038 strinfo *si, *zsi;
2040 if (idx == 0)
2041 return;
2043 if (idx < 0)
2045 tree off = gimple_assign_rhs2 (stmt);
2046 if (tree_fits_uhwi_p (off)
2047 && tree_to_uhwi (off) <= (unsigned HOST_WIDE_INT) ~idx)
2048 ssa_ver_to_stridx[SSA_NAME_VERSION (lhs)]
2049 = ~(~idx - (int) tree_to_uhwi (off));
2050 return;
2053 si = get_strinfo (idx);
2054 if (si == NULL || si->length == NULL_TREE)
2055 return;
2057 off = gimple_assign_rhs2 (stmt);
2058 zsi = NULL;
2059 if (operand_equal_p (si->length, off, 0))
2060 zsi = zero_length_string (lhs, si);
2061 else if (TREE_CODE (off) == SSA_NAME)
2063 gimple *def_stmt = SSA_NAME_DEF_STMT (off);
2064 if (gimple_assign_single_p (def_stmt)
2065 && operand_equal_p (si->length, gimple_assign_rhs1 (def_stmt), 0))
2066 zsi = zero_length_string (lhs, si);
2068 if (zsi != NULL
2069 && si->endptr != NULL_TREE
2070 && si->endptr != lhs
2071 && TREE_CODE (si->endptr) == SSA_NAME)
2073 enum tree_code rhs_code
2074 = useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (si->endptr))
2075 ? SSA_NAME : NOP_EXPR;
2076 gimple_assign_set_rhs_with_ops (gsi, rhs_code, si->endptr);
2077 gcc_assert (gsi_stmt (*gsi) == stmt);
2078 update_stmt (stmt);
2082 /* Handle a single character store. */
2084 static bool
2085 handle_char_store (gimple_stmt_iterator *gsi)
2087 int idx = -1;
2088 strinfo *si = NULL;
2089 gimple *stmt = gsi_stmt (*gsi);
2090 tree ssaname = NULL_TREE, lhs = gimple_assign_lhs (stmt);
2092 if (TREE_CODE (lhs) == MEM_REF
2093 && TREE_CODE (TREE_OPERAND (lhs, 0)) == SSA_NAME)
2095 if (integer_zerop (TREE_OPERAND (lhs, 1)))
2097 ssaname = TREE_OPERAND (lhs, 0);
2098 idx = get_stridx (ssaname);
2101 else
2102 idx = get_addr_stridx (lhs, NULL_TREE);
2104 if (idx > 0)
2106 si = get_strinfo (idx);
2107 if (si != NULL && si->length != NULL_TREE && integer_zerop (si->length))
2109 if (initializer_zerop (gimple_assign_rhs1 (stmt)))
2111 /* When storing '\0', the store can be removed
2112 if we know it has been stored in the current function. */
2113 if (!stmt_could_throw_p (stmt) && si->writable)
2115 unlink_stmt_vdef (stmt);
2116 release_defs (stmt);
2117 gsi_remove (gsi, true);
2118 return false;
2120 else
2122 si->writable = true;
2123 gsi_next (gsi);
2124 return false;
2127 else
2128 /* Otherwise this statement overwrites the '\0' with
2129 something, if the previous stmt was a memcpy,
2130 its length may be decreased. */
2131 adjust_last_stmt (si, stmt, false);
2133 else if (si != NULL && integer_zerop (gimple_assign_rhs1 (stmt)))
2135 si = unshare_strinfo (si);
2136 si->length = build_int_cst (size_type_node, 0);
2137 si->endptr = NULL;
2138 si->prev = 0;
2139 si->next = 0;
2140 si->stmt = NULL;
2141 si->first = 0;
2142 si->writable = true;
2143 if (ssaname && !SSA_NAME_OCCURS_IN_ABNORMAL_PHI (ssaname))
2144 si->endptr = ssaname;
2145 si->dont_invalidate = true;
2147 /* If si->length is non-zero constant, we aren't overwriting '\0',
2148 and if we aren't storing '\0', we know that the length of the
2149 string and any other zero terminated string in memory remains
2150 the same. In that case we move to the next gimple statement and
2151 return to signal the caller that it shouldn't invalidate anything.
2153 This is benefical for cases like:
2155 char p[20];
2156 void foo (char *q)
2158 strcpy (p, "foobar");
2159 size_t len = strlen (p); // This can be optimized into 6
2160 size_t len2 = strlen (q); // This has to be computed
2161 p[0] = 'X';
2162 size_t len3 = strlen (p); // This can be optimized into 6
2163 size_t len4 = strlen (q); // This can be optimized into len2
2164 bar (len, len2, len3, len4);
2167 else if (si != NULL && si->length != NULL_TREE
2168 && TREE_CODE (si->length) == INTEGER_CST
2169 && integer_nonzerop (gimple_assign_rhs1 (stmt)))
2171 gsi_next (gsi);
2172 return false;
2175 else if (idx == 0 && initializer_zerop (gimple_assign_rhs1 (stmt)))
2177 if (ssaname)
2179 si = zero_length_string (ssaname, NULL);
2180 if (si != NULL)
2181 si->dont_invalidate = true;
2183 else
2185 int idx = new_addr_stridx (lhs);
2186 if (idx != 0)
2188 si = new_strinfo (build_fold_addr_expr (lhs), idx,
2189 build_int_cst (size_type_node, 0));
2190 set_strinfo (idx, si);
2191 si->dont_invalidate = true;
2194 if (si != NULL)
2195 si->writable = true;
2197 else if (idx == 0
2198 && TREE_CODE (gimple_assign_rhs1 (stmt)) == STRING_CST
2199 && ssaname == NULL_TREE
2200 && TREE_CODE (TREE_TYPE (lhs)) == ARRAY_TYPE)
2202 size_t l = strlen (TREE_STRING_POINTER (gimple_assign_rhs1 (stmt)));
2203 HOST_WIDE_INT a = int_size_in_bytes (TREE_TYPE (lhs));
2204 if (a > 0 && (unsigned HOST_WIDE_INT) a > l)
2206 int idx = new_addr_stridx (lhs);
2207 if (idx != 0)
2209 si = new_strinfo (build_fold_addr_expr (lhs), idx,
2210 build_int_cst (size_type_node, l));
2211 set_strinfo (idx, si);
2212 si->dont_invalidate = true;
2217 if (si != NULL && initializer_zerop (gimple_assign_rhs1 (stmt)))
2219 /* Allow adjust_last_stmt to remove it if the stored '\0'
2220 is immediately overwritten. */
2221 laststmt.stmt = stmt;
2222 laststmt.len = build_int_cst (size_type_node, 1);
2223 laststmt.stridx = si->idx;
2225 return true;
2228 /* Try to fold strstr (s, t) eq/ne s to strncmp (s, t, strlen (t)) eq/ne 0. */
2230 static void
2231 fold_strstr_to_strncmp (tree rhs1, tree rhs2, gimple *stmt)
2233 if (TREE_CODE (rhs1) != SSA_NAME
2234 || TREE_CODE (rhs2) != SSA_NAME)
2235 return;
2237 gimple *call_stmt = NULL;
2238 for (int pass = 0; pass < 2; pass++)
2240 gimple *g = SSA_NAME_DEF_STMT (rhs1);
2241 if (gimple_call_builtin_p (g, BUILT_IN_STRSTR)
2242 && has_single_use (rhs1)
2243 && gimple_call_arg (g, 0) == rhs2)
2245 call_stmt = g;
2246 break;
2248 std::swap (rhs1, rhs2);
2251 if (call_stmt)
2253 tree arg0 = gimple_call_arg (call_stmt, 0);
2255 if (arg0 == rhs2)
2257 tree arg1 = gimple_call_arg (call_stmt, 1);
2258 tree arg1_len = NULL_TREE;
2259 int idx = get_stridx (arg1);
2261 if (idx)
2263 if (idx < 0)
2264 arg1_len = build_int_cst (size_type_node, ~idx);
2265 else
2267 strinfo *si = get_strinfo (idx);
2268 if (si)
2269 arg1_len = get_string_length (si);
2273 if (arg1_len != NULL_TREE)
2275 gimple_stmt_iterator gsi = gsi_for_stmt (call_stmt);
2276 tree strncmp_decl = builtin_decl_explicit (BUILT_IN_STRNCMP);
2277 gcall *strncmp_call = gimple_build_call (strncmp_decl, 3,
2278 arg0, arg1, arg1_len);
2279 tree strncmp_lhs = make_ssa_name (integer_type_node);
2280 gimple_set_vuse (strncmp_call, gimple_vuse (call_stmt));
2281 gimple_call_set_lhs (strncmp_call, strncmp_lhs);
2282 gsi_remove (&gsi, true);
2283 gsi_insert_before (&gsi, strncmp_call, GSI_SAME_STMT);
2284 tree zero = build_zero_cst (TREE_TYPE (strncmp_lhs));
2286 if (is_gimple_assign (stmt))
2288 if (gimple_assign_rhs_code (stmt) == COND_EXPR)
2290 tree cond = gimple_assign_rhs1 (stmt);
2291 TREE_OPERAND (cond, 0) = strncmp_lhs;
2292 TREE_OPERAND (cond, 1) = zero;
2294 else
2296 gimple_assign_set_rhs1 (stmt, strncmp_lhs);
2297 gimple_assign_set_rhs2 (stmt, zero);
2300 else
2302 gcond *cond = as_a<gcond *> (stmt);
2303 gimple_cond_set_lhs (cond, strncmp_lhs);
2304 gimple_cond_set_rhs (cond, zero);
2306 update_stmt (stmt);
2312 /* Attempt to optimize a single statement at *GSI using string length
2313 knowledge. */
2315 static bool
2316 strlen_optimize_stmt (gimple_stmt_iterator *gsi)
2318 gimple *stmt = gsi_stmt (*gsi);
2320 if (is_gimple_call (stmt))
2322 tree callee = gimple_call_fndecl (stmt);
2323 if (valid_builtin_call (stmt))
2324 switch (DECL_FUNCTION_CODE (callee))
2326 case BUILT_IN_STRLEN:
2327 case BUILT_IN_STRLEN_CHKP:
2328 handle_builtin_strlen (gsi);
2329 break;
2330 case BUILT_IN_STRCHR:
2331 case BUILT_IN_STRCHR_CHKP:
2332 handle_builtin_strchr (gsi);
2333 break;
2334 case BUILT_IN_STRCPY:
2335 case BUILT_IN_STRCPY_CHK:
2336 case BUILT_IN_STPCPY:
2337 case BUILT_IN_STPCPY_CHK:
2338 case BUILT_IN_STRCPY_CHKP:
2339 case BUILT_IN_STRCPY_CHK_CHKP:
2340 case BUILT_IN_STPCPY_CHKP:
2341 case BUILT_IN_STPCPY_CHK_CHKP:
2342 handle_builtin_strcpy (DECL_FUNCTION_CODE (callee), gsi);
2343 break;
2344 case BUILT_IN_MEMCPY:
2345 case BUILT_IN_MEMCPY_CHK:
2346 case BUILT_IN_MEMPCPY:
2347 case BUILT_IN_MEMPCPY_CHK:
2348 case BUILT_IN_MEMCPY_CHKP:
2349 case BUILT_IN_MEMCPY_CHK_CHKP:
2350 case BUILT_IN_MEMPCPY_CHKP:
2351 case BUILT_IN_MEMPCPY_CHK_CHKP:
2352 handle_builtin_memcpy (DECL_FUNCTION_CODE (callee), gsi);
2353 break;
2354 case BUILT_IN_STRCAT:
2355 case BUILT_IN_STRCAT_CHK:
2356 case BUILT_IN_STRCAT_CHKP:
2357 case BUILT_IN_STRCAT_CHK_CHKP:
2358 handle_builtin_strcat (DECL_FUNCTION_CODE (callee), gsi);
2359 break;
2360 case BUILT_IN_MALLOC:
2361 case BUILT_IN_CALLOC:
2362 handle_builtin_malloc (DECL_FUNCTION_CODE (callee), gsi);
2363 break;
2364 case BUILT_IN_MEMSET:
2365 if (!handle_builtin_memset (gsi))
2366 return false;
2367 break;
2368 case BUILT_IN_MEMCMP:
2369 if (!handle_builtin_memcmp (gsi))
2370 return false;
2371 break;
2372 default:
2373 break;
2376 else if (is_gimple_assign (stmt) && !gimple_clobber_p (stmt))
2378 tree lhs = gimple_assign_lhs (stmt);
2380 if (TREE_CODE (lhs) == SSA_NAME && POINTER_TYPE_P (TREE_TYPE (lhs)))
2382 if (gimple_assign_single_p (stmt)
2383 || (gimple_assign_cast_p (stmt)
2384 && POINTER_TYPE_P (TREE_TYPE (gimple_assign_rhs1 (stmt)))))
2386 int idx = get_stridx (gimple_assign_rhs1 (stmt));
2387 ssa_ver_to_stridx[SSA_NAME_VERSION (lhs)] = idx;
2389 else if (gimple_assign_rhs_code (stmt) == POINTER_PLUS_EXPR)
2390 handle_pointer_plus (gsi);
2392 else if (TREE_CODE (lhs) == SSA_NAME && INTEGRAL_TYPE_P (TREE_TYPE (lhs)))
2394 enum tree_code code = gimple_assign_rhs_code (stmt);
2395 if (code == COND_EXPR)
2397 tree cond = gimple_assign_rhs1 (stmt);
2398 enum tree_code cond_code = TREE_CODE (cond);
2400 if (cond_code == EQ_EXPR || cond_code == NE_EXPR)
2401 fold_strstr_to_strncmp (TREE_OPERAND (cond, 0),
2402 TREE_OPERAND (cond, 1), stmt);
2404 else if (code == EQ_EXPR || code == NE_EXPR)
2405 fold_strstr_to_strncmp (gimple_assign_rhs1 (stmt),
2406 gimple_assign_rhs2 (stmt), stmt);
2408 else if (TREE_CODE (lhs) != SSA_NAME && !TREE_SIDE_EFFECTS (lhs))
2410 tree type = TREE_TYPE (lhs);
2411 if (TREE_CODE (type) == ARRAY_TYPE)
2412 type = TREE_TYPE (type);
2413 if (TREE_CODE (type) == INTEGER_TYPE
2414 && TYPE_MODE (type) == TYPE_MODE (char_type_node)
2415 && TYPE_PRECISION (type) == TYPE_PRECISION (char_type_node))
2417 if (! handle_char_store (gsi))
2418 return false;
2422 else if (gcond *cond = dyn_cast<gcond *> (stmt))
2424 enum tree_code code = gimple_cond_code (cond);
2425 if (code == EQ_EXPR || code == NE_EXPR)
2426 fold_strstr_to_strncmp (gimple_cond_lhs (stmt),
2427 gimple_cond_rhs (stmt), stmt);
2430 if (gimple_vdef (stmt))
2431 maybe_invalidate (stmt);
2432 return true;
2435 /* Recursively call maybe_invalidate on stmts that might be executed
2436 in between dombb and current bb and that contain a vdef. Stop when
2437 *count stmts are inspected, or if the whole strinfo vector has
2438 been invalidated. */
2440 static void
2441 do_invalidate (basic_block dombb, gimple *phi, bitmap visited, int *count)
2443 unsigned int i, n = gimple_phi_num_args (phi);
2445 for (i = 0; i < n; i++)
2447 tree vuse = gimple_phi_arg_def (phi, i);
2448 gimple *stmt = SSA_NAME_DEF_STMT (vuse);
2449 basic_block bb = gimple_bb (stmt);
2450 if (bb == NULL
2451 || bb == dombb
2452 || !bitmap_set_bit (visited, bb->index)
2453 || !dominated_by_p (CDI_DOMINATORS, bb, dombb))
2454 continue;
2455 while (1)
2457 if (gimple_code (stmt) == GIMPLE_PHI)
2459 do_invalidate (dombb, stmt, visited, count);
2460 if (*count == 0)
2461 return;
2462 break;
2464 if (--*count == 0)
2465 return;
2466 if (!maybe_invalidate (stmt))
2468 *count = 0;
2469 return;
2471 vuse = gimple_vuse (stmt);
2472 stmt = SSA_NAME_DEF_STMT (vuse);
2473 if (gimple_bb (stmt) != bb)
2475 bb = gimple_bb (stmt);
2476 if (bb == NULL
2477 || bb == dombb
2478 || !bitmap_set_bit (visited, bb->index)
2479 || !dominated_by_p (CDI_DOMINATORS, bb, dombb))
2480 break;
2486 class strlen_dom_walker : public dom_walker
2488 public:
2489 strlen_dom_walker (cdi_direction direction) : dom_walker (direction) {}
2491 virtual edge before_dom_children (basic_block);
2492 virtual void after_dom_children (basic_block);
2495 /* Callback for walk_dominator_tree. Attempt to optimize various
2496 string ops by remembering string lengths pointed by pointer SSA_NAMEs. */
2498 edge
2499 strlen_dom_walker::before_dom_children (basic_block bb)
2501 basic_block dombb = get_immediate_dominator (CDI_DOMINATORS, bb);
2503 if (dombb == NULL)
2504 stridx_to_strinfo = NULL;
2505 else
2507 stridx_to_strinfo = ((vec<strinfo *, va_heap, vl_embed> *) dombb->aux);
2508 if (stridx_to_strinfo)
2510 for (gphi_iterator gsi = gsi_start_phis (bb); !gsi_end_p (gsi);
2511 gsi_next (&gsi))
2513 gphi *phi = gsi.phi ();
2514 if (virtual_operand_p (gimple_phi_result (phi)))
2516 bitmap visited = BITMAP_ALLOC (NULL);
2517 int count_vdef = 100;
2518 do_invalidate (dombb, phi, visited, &count_vdef);
2519 BITMAP_FREE (visited);
2520 if (count_vdef == 0)
2522 /* If there were too many vdefs in between immediate
2523 dominator and current bb, invalidate everything.
2524 If stridx_to_strinfo has been unshared, we need
2525 to free it, otherwise just set it to NULL. */
2526 if (!strinfo_shared ())
2528 unsigned int i;
2529 strinfo *si;
2531 for (i = 1;
2532 vec_safe_iterate (stridx_to_strinfo, i, &si);
2533 ++i)
2535 free_strinfo (si);
2536 (*stridx_to_strinfo)[i] = NULL;
2539 else
2540 stridx_to_strinfo = NULL;
2542 break;
2548 /* If all PHI arguments have the same string index, the PHI result
2549 has it as well. */
2550 for (gphi_iterator gsi = gsi_start_phis (bb); !gsi_end_p (gsi);
2551 gsi_next (&gsi))
2553 gphi *phi = gsi.phi ();
2554 tree result = gimple_phi_result (phi);
2555 if (!virtual_operand_p (result) && POINTER_TYPE_P (TREE_TYPE (result)))
2557 int idx = get_stridx (gimple_phi_arg_def (phi, 0));
2558 if (idx != 0)
2560 unsigned int i, n = gimple_phi_num_args (phi);
2561 for (i = 1; i < n; i++)
2562 if (idx != get_stridx (gimple_phi_arg_def (phi, i)))
2563 break;
2564 if (i == n)
2565 ssa_ver_to_stridx[SSA_NAME_VERSION (result)] = idx;
2570 /* Attempt to optimize individual statements. */
2571 for (gimple_stmt_iterator gsi = gsi_start_bb (bb); !gsi_end_p (gsi); )
2572 if (strlen_optimize_stmt (&gsi))
2573 gsi_next (&gsi);
2575 bb->aux = stridx_to_strinfo;
2576 if (vec_safe_length (stridx_to_strinfo) && !strinfo_shared ())
2577 (*stridx_to_strinfo)[0] = (strinfo *) bb;
2578 return NULL;
2581 /* Callback for walk_dominator_tree. Free strinfo vector if it is
2582 owned by the current bb, clear bb->aux. */
2584 void
2585 strlen_dom_walker::after_dom_children (basic_block bb)
2587 if (bb->aux)
2589 stridx_to_strinfo = ((vec<strinfo *, va_heap, vl_embed> *) bb->aux);
2590 if (vec_safe_length (stridx_to_strinfo)
2591 && (*stridx_to_strinfo)[0] == (strinfo *) bb)
2593 unsigned int i;
2594 strinfo *si;
2596 for (i = 1; vec_safe_iterate (stridx_to_strinfo, i, &si); ++i)
2597 free_strinfo (si);
2598 vec_free (stridx_to_strinfo);
2600 bb->aux = NULL;
2604 /* Main entry point. */
2606 namespace {
2608 const pass_data pass_data_strlen =
2610 GIMPLE_PASS, /* type */
2611 "strlen", /* name */
2612 OPTGROUP_NONE, /* optinfo_flags */
2613 TV_TREE_STRLEN, /* tv_id */
2614 ( PROP_cfg | PROP_ssa ), /* properties_required */
2615 0, /* properties_provided */
2616 0, /* properties_destroyed */
2617 0, /* todo_flags_start */
2618 0, /* todo_flags_finish */
2621 class pass_strlen : public gimple_opt_pass
2623 public:
2624 pass_strlen (gcc::context *ctxt)
2625 : gimple_opt_pass (pass_data_strlen, ctxt)
2628 /* opt_pass methods: */
2629 virtual bool gate (function *) { return flag_optimize_strlen != 0; }
2630 virtual unsigned int execute (function *);
2632 }; // class pass_strlen
2634 unsigned int
2635 pass_strlen::execute (function *fun)
2637 ssa_ver_to_stridx.safe_grow_cleared (num_ssa_names);
2638 max_stridx = 1;
2640 calculate_dominance_info (CDI_DOMINATORS);
2642 /* String length optimization is implemented as a walk of the dominator
2643 tree and a forward walk of statements within each block. */
2644 strlen_dom_walker (CDI_DOMINATORS).walk (fun->cfg->x_entry_block_ptr);
2646 ssa_ver_to_stridx.release ();
2647 strinfo_pool.release ();
2648 if (decl_to_stridxlist_htab)
2650 obstack_free (&stridx_obstack, NULL);
2651 delete decl_to_stridxlist_htab;
2652 decl_to_stridxlist_htab = NULL;
2654 laststmt.stmt = NULL;
2655 laststmt.len = NULL_TREE;
2656 laststmt.stridx = 0;
2658 return 0;
2661 } // anon namespace
2663 gimple_opt_pass *
2664 make_pass_strlen (gcc::context *ctxt)
2666 return new pass_strlen (ctxt);