Merge trunk version 211672 into gupc branch.
[official-gcc.git] / gcc / trans-mem.c
blobb728d743d6e4a2a48b277a18d38d1ba069b39952
1 /* Passes for transactional memory support.
2 Copyright (C) 2008-2014 Free Software Foundation, Inc.
4 This file is part of GCC.
6 GCC is free software; you can redistribute it and/or modify it under
7 the terms of the GNU General Public License as published by the Free
8 Software Foundation; either version 3, or (at your option) any later
9 version.
11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 for more details.
16 You should have received a copy of the GNU General Public License
17 along with GCC; see the file COPYING3. If not see
18 <http://www.gnu.org/licenses/>. */
20 #include "config.h"
21 #include "system.h"
22 #include "coretypes.h"
23 #include "hash-table.h"
24 #include "tree.h"
25 #include "basic-block.h"
26 #include "tree-ssa-alias.h"
27 #include "internal-fn.h"
28 #include "tree-eh.h"
29 #include "gimple-expr.h"
30 #include "is-a.h"
31 #include "gimple.h"
32 #include "calls.h"
33 #include "function.h"
34 #include "rtl.h"
35 #include "emit-rtl.h"
36 #include "gimplify.h"
37 #include "gimple-iterator.h"
38 #include "gimplify-me.h"
39 #include "gimple-walk.h"
40 #include "gimple-ssa.h"
41 #include "cgraph.h"
42 #include "tree-cfg.h"
43 #include "stringpool.h"
44 #include "tree-ssanames.h"
45 #include "tree-into-ssa.h"
46 #include "tree-pass.h"
47 #include "tree-inline.h"
48 #include "diagnostic-core.h"
49 #include "demangle.h"
50 #include "output.h"
51 #include "trans-mem.h"
52 #include "params.h"
53 #include "target.h"
54 #include "langhooks.h"
55 #include "gimple-pretty-print.h"
56 #include "cfgloop.h"
57 #include "tree-ssa-address.h"
58 #include "predict.h"
61 #define A_RUNINSTRUMENTEDCODE 0x0001
62 #define A_RUNUNINSTRUMENTEDCODE 0x0002
63 #define A_SAVELIVEVARIABLES 0x0004
64 #define A_RESTORELIVEVARIABLES 0x0008
65 #define A_ABORTTRANSACTION 0x0010
67 #define AR_USERABORT 0x0001
68 #define AR_USERRETRY 0x0002
69 #define AR_TMCONFLICT 0x0004
70 #define AR_EXCEPTIONBLOCKABORT 0x0008
71 #define AR_OUTERABORT 0x0010
73 #define MODE_SERIALIRREVOCABLE 0x0000
76 /* The representation of a transaction changes several times during the
77 lowering process. In the beginning, in the front-end we have the
78 GENERIC tree TRANSACTION_EXPR. For example,
80 __transaction {
81 local++;
82 if (++global == 10)
83 __tm_abort;
86 During initial gimplification (gimplify.c) the TRANSACTION_EXPR node is
87 trivially replaced with a GIMPLE_TRANSACTION node.
89 During pass_lower_tm, we examine the body of transactions looking
90 for aborts. Transactions that do not contain an abort may be
91 merged into an outer transaction. We also add a TRY-FINALLY node
92 to arrange for the transaction to be committed on any exit.
94 [??? Think about how this arrangement affects throw-with-commit
95 and throw-with-abort operations. In this case we want the TRY to
96 handle gotos, but not to catch any exceptions because the transaction
97 will already be closed.]
99 GIMPLE_TRANSACTION [label=NULL] {
100 try {
101 local = local + 1;
102 t0 = global;
103 t1 = t0 + 1;
104 global = t1;
105 if (t1 == 10)
106 __builtin___tm_abort ();
107 } finally {
108 __builtin___tm_commit ();
112 During pass_lower_eh, we create EH regions for the transactions,
113 intermixed with the regular EH stuff. This gives us a nice persistent
114 mapping (all the way through rtl) from transactional memory operation
115 back to the transaction, which allows us to get the abnormal edges
116 correct to model transaction aborts and restarts:
118 GIMPLE_TRANSACTION [label=over]
119 local = local + 1;
120 t0 = global;
121 t1 = t0 + 1;
122 global = t1;
123 if (t1 == 10)
124 __builtin___tm_abort ();
125 __builtin___tm_commit ();
126 over:
128 This is the end of all_lowering_passes, and so is what is present
129 during the IPA passes, and through all of the optimization passes.
131 During pass_ipa_tm, we examine all GIMPLE_TRANSACTION blocks in all
132 functions and mark functions for cloning.
134 At the end of gimple optimization, before exiting SSA form,
135 pass_tm_edges replaces statements that perform transactional
136 memory operations with the appropriate TM builtins, and swap
137 out function calls with their transactional clones. At this
138 point we introduce the abnormal transaction restart edges and
139 complete lowering of the GIMPLE_TRANSACTION node.
141 x = __builtin___tm_start (MAY_ABORT);
142 eh_label:
143 if (x & abort_transaction)
144 goto over;
145 local = local + 1;
146 t0 = __builtin___tm_load (global);
147 t1 = t0 + 1;
148 __builtin___tm_store (&global, t1);
149 if (t1 == 10)
150 __builtin___tm_abort ();
151 __builtin___tm_commit ();
152 over:
155 static void *expand_regions (struct tm_region *,
156 void *(*callback)(struct tm_region *, void *),
157 void *, bool);
160 /* Return the attributes we want to examine for X, or NULL if it's not
161 something we examine. We look at function types, but allow pointers
162 to function types and function decls and peek through. */
164 static tree
165 get_attrs_for (const_tree x)
167 switch (TREE_CODE (x))
169 case FUNCTION_DECL:
170 return TYPE_ATTRIBUTES (TREE_TYPE (x));
171 break;
173 default:
174 if (TYPE_P (x))
175 return NULL;
176 x = TREE_TYPE (x);
177 if (TREE_CODE (x) != POINTER_TYPE)
178 return NULL;
179 /* FALLTHRU */
181 case POINTER_TYPE:
182 x = TREE_TYPE (x);
183 if (TREE_CODE (x) != FUNCTION_TYPE && TREE_CODE (x) != METHOD_TYPE)
184 return NULL;
185 /* FALLTHRU */
187 case FUNCTION_TYPE:
188 case METHOD_TYPE:
189 return TYPE_ATTRIBUTES (x);
193 /* Return true if X has been marked TM_PURE. */
195 bool
196 is_tm_pure (const_tree x)
198 unsigned flags;
200 switch (TREE_CODE (x))
202 case FUNCTION_DECL:
203 case FUNCTION_TYPE:
204 case METHOD_TYPE:
205 break;
207 default:
208 if (TYPE_P (x))
209 return false;
210 x = TREE_TYPE (x);
211 if (TREE_CODE (x) != POINTER_TYPE)
212 return false;
213 /* FALLTHRU */
215 case POINTER_TYPE:
216 x = TREE_TYPE (x);
217 if (TREE_CODE (x) != FUNCTION_TYPE && TREE_CODE (x) != METHOD_TYPE)
218 return false;
219 break;
222 flags = flags_from_decl_or_type (x);
223 return (flags & ECF_TM_PURE) != 0;
226 /* Return true if X has been marked TM_IRREVOCABLE. */
228 static bool
229 is_tm_irrevocable (tree x)
231 tree attrs = get_attrs_for (x);
233 if (attrs && lookup_attribute ("transaction_unsafe", attrs))
234 return true;
236 /* A call to the irrevocable builtin is by definition,
237 irrevocable. */
238 if (TREE_CODE (x) == ADDR_EXPR)
239 x = TREE_OPERAND (x, 0);
240 if (TREE_CODE (x) == FUNCTION_DECL
241 && DECL_BUILT_IN_CLASS (x) == BUILT_IN_NORMAL
242 && DECL_FUNCTION_CODE (x) == BUILT_IN_TM_IRREVOCABLE)
243 return true;
245 return false;
248 /* Return true if X has been marked TM_SAFE. */
250 bool
251 is_tm_safe (const_tree x)
253 if (flag_tm)
255 tree attrs = get_attrs_for (x);
256 if (attrs)
258 if (lookup_attribute ("transaction_safe", attrs))
259 return true;
260 if (lookup_attribute ("transaction_may_cancel_outer", attrs))
261 return true;
264 return false;
267 /* Return true if CALL is const, or tm_pure. */
269 static bool
270 is_tm_pure_call (gimple call)
272 tree fn = gimple_call_fn (call);
274 if (TREE_CODE (fn) == ADDR_EXPR)
276 fn = TREE_OPERAND (fn, 0);
277 gcc_assert (TREE_CODE (fn) == FUNCTION_DECL);
279 else
280 fn = TREE_TYPE (fn);
282 return is_tm_pure (fn);
285 /* Return true if X has been marked TM_CALLABLE. */
287 static bool
288 is_tm_callable (tree x)
290 tree attrs = get_attrs_for (x);
291 if (attrs)
293 if (lookup_attribute ("transaction_callable", attrs))
294 return true;
295 if (lookup_attribute ("transaction_safe", attrs))
296 return true;
297 if (lookup_attribute ("transaction_may_cancel_outer", attrs))
298 return true;
300 return false;
303 /* Return true if X has been marked TRANSACTION_MAY_CANCEL_OUTER. */
305 bool
306 is_tm_may_cancel_outer (tree x)
308 tree attrs = get_attrs_for (x);
309 if (attrs)
310 return lookup_attribute ("transaction_may_cancel_outer", attrs) != NULL;
311 return false;
314 /* Return true for built in functions that "end" a transaction. */
316 bool
317 is_tm_ending_fndecl (tree fndecl)
319 if (DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
320 switch (DECL_FUNCTION_CODE (fndecl))
322 case BUILT_IN_TM_COMMIT:
323 case BUILT_IN_TM_COMMIT_EH:
324 case BUILT_IN_TM_ABORT:
325 case BUILT_IN_TM_IRREVOCABLE:
326 return true;
327 default:
328 break;
331 return false;
334 /* Return true if STMT is a built in function call that "ends" a
335 transaction. */
337 bool
338 is_tm_ending (gimple stmt)
340 tree fndecl;
342 if (gimple_code (stmt) != GIMPLE_CALL)
343 return false;
345 fndecl = gimple_call_fndecl (stmt);
346 return (fndecl != NULL_TREE
347 && is_tm_ending_fndecl (fndecl));
350 /* Return true if STMT is a TM load. */
352 static bool
353 is_tm_load (gimple stmt)
355 tree fndecl;
357 if (gimple_code (stmt) != GIMPLE_CALL)
358 return false;
360 fndecl = gimple_call_fndecl (stmt);
361 return (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
362 && BUILTIN_TM_LOAD_P (DECL_FUNCTION_CODE (fndecl)));
365 /* Same as above, but for simple TM loads, that is, not the
366 after-write, after-read, etc optimized variants. */
368 static bool
369 is_tm_simple_load (gimple stmt)
371 tree fndecl;
373 if (gimple_code (stmt) != GIMPLE_CALL)
374 return false;
376 fndecl = gimple_call_fndecl (stmt);
377 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
379 enum built_in_function fcode = DECL_FUNCTION_CODE (fndecl);
380 return (fcode == BUILT_IN_TM_LOAD_1
381 || fcode == BUILT_IN_TM_LOAD_2
382 || fcode == BUILT_IN_TM_LOAD_4
383 || fcode == BUILT_IN_TM_LOAD_8
384 || fcode == BUILT_IN_TM_LOAD_FLOAT
385 || fcode == BUILT_IN_TM_LOAD_DOUBLE
386 || fcode == BUILT_IN_TM_LOAD_LDOUBLE
387 || fcode == BUILT_IN_TM_LOAD_M64
388 || fcode == BUILT_IN_TM_LOAD_M128
389 || fcode == BUILT_IN_TM_LOAD_M256);
391 return false;
394 /* Return true if STMT is a TM store. */
396 static bool
397 is_tm_store (gimple stmt)
399 tree fndecl;
401 if (gimple_code (stmt) != GIMPLE_CALL)
402 return false;
404 fndecl = gimple_call_fndecl (stmt);
405 return (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
406 && BUILTIN_TM_STORE_P (DECL_FUNCTION_CODE (fndecl)));
409 /* Same as above, but for simple TM stores, that is, not the
410 after-write, after-read, etc optimized variants. */
412 static bool
413 is_tm_simple_store (gimple stmt)
415 tree fndecl;
417 if (gimple_code (stmt) != GIMPLE_CALL)
418 return false;
420 fndecl = gimple_call_fndecl (stmt);
421 if (fndecl && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
423 enum built_in_function fcode = DECL_FUNCTION_CODE (fndecl);
424 return (fcode == BUILT_IN_TM_STORE_1
425 || fcode == BUILT_IN_TM_STORE_2
426 || fcode == BUILT_IN_TM_STORE_4
427 || fcode == BUILT_IN_TM_STORE_8
428 || fcode == BUILT_IN_TM_STORE_FLOAT
429 || fcode == BUILT_IN_TM_STORE_DOUBLE
430 || fcode == BUILT_IN_TM_STORE_LDOUBLE
431 || fcode == BUILT_IN_TM_STORE_M64
432 || fcode == BUILT_IN_TM_STORE_M128
433 || fcode == BUILT_IN_TM_STORE_M256);
435 return false;
438 /* Return true if FNDECL is BUILT_IN_TM_ABORT. */
440 static bool
441 is_tm_abort (tree fndecl)
443 return (fndecl
444 && DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL
445 && DECL_FUNCTION_CODE (fndecl) == BUILT_IN_TM_ABORT);
448 /* Build a GENERIC tree for a user abort. This is called by front ends
449 while transforming the __tm_abort statement. */
451 tree
452 build_tm_abort_call (location_t loc, bool is_outer)
454 return build_call_expr_loc (loc, builtin_decl_explicit (BUILT_IN_TM_ABORT), 1,
455 build_int_cst (integer_type_node,
456 AR_USERABORT
457 | (is_outer ? AR_OUTERABORT : 0)));
460 /* Map for aribtrary function replacement under TM, as created
461 by the tm_wrap attribute. */
463 static GTY((if_marked ("tree_map_marked_p"), param_is (struct tree_map)))
464 htab_t tm_wrap_map;
466 void
467 record_tm_replacement (tree from, tree to)
469 struct tree_map **slot, *h;
471 /* Do not inline wrapper functions that will get replaced in the TM
472 pass.
474 Suppose you have foo() that will get replaced into tmfoo(). Make
475 sure the inliner doesn't try to outsmart us and inline foo()
476 before we get a chance to do the TM replacement. */
477 DECL_UNINLINABLE (from) = 1;
479 if (tm_wrap_map == NULL)
480 tm_wrap_map = htab_create_ggc (32, tree_map_hash, tree_map_eq, 0);
482 h = ggc_alloc<tree_map> ();
483 h->hash = htab_hash_pointer (from);
484 h->base.from = from;
485 h->to = to;
487 slot = (struct tree_map **)
488 htab_find_slot_with_hash (tm_wrap_map, h, h->hash, INSERT);
489 *slot = h;
492 /* Return a TM-aware replacement function for DECL. */
494 static tree
495 find_tm_replacement_function (tree fndecl)
497 if (tm_wrap_map)
499 struct tree_map *h, in;
501 in.base.from = fndecl;
502 in.hash = htab_hash_pointer (fndecl);
503 h = (struct tree_map *) htab_find_with_hash (tm_wrap_map, &in, in.hash);
504 if (h)
505 return h->to;
508 /* ??? We may well want TM versions of most of the common <string.h>
509 functions. For now, we've already these two defined. */
510 /* Adjust expand_call_tm() attributes as necessary for the cases
511 handled here: */
512 if (DECL_BUILT_IN_CLASS (fndecl) == BUILT_IN_NORMAL)
513 switch (DECL_FUNCTION_CODE (fndecl))
515 case BUILT_IN_MEMCPY:
516 return builtin_decl_explicit (BUILT_IN_TM_MEMCPY);
517 case BUILT_IN_MEMMOVE:
518 return builtin_decl_explicit (BUILT_IN_TM_MEMMOVE);
519 case BUILT_IN_MEMSET:
520 return builtin_decl_explicit (BUILT_IN_TM_MEMSET);
521 default:
522 return NULL;
525 return NULL;
528 /* When appropriate, record TM replacement for memory allocation functions.
530 FROM is the FNDECL to wrap. */
531 void
532 tm_malloc_replacement (tree from)
534 const char *str;
535 tree to;
537 if (TREE_CODE (from) != FUNCTION_DECL)
538 return;
540 /* If we have a previous replacement, the user must be explicitly
541 wrapping malloc/calloc/free. They better know what they're
542 doing... */
543 if (find_tm_replacement_function (from))
544 return;
546 str = IDENTIFIER_POINTER (DECL_NAME (from));
548 if (!strcmp (str, "malloc"))
549 to = builtin_decl_explicit (BUILT_IN_TM_MALLOC);
550 else if (!strcmp (str, "calloc"))
551 to = builtin_decl_explicit (BUILT_IN_TM_CALLOC);
552 else if (!strcmp (str, "free"))
553 to = builtin_decl_explicit (BUILT_IN_TM_FREE);
554 else
555 return;
557 TREE_NOTHROW (to) = 0;
559 record_tm_replacement (from, to);
562 /* Diagnostics for tm_safe functions/regions. Called by the front end
563 once we've lowered the function to high-gimple. */
565 /* Subroutine of diagnose_tm_safe_errors, called through walk_gimple_seq.
566 Process exactly one statement. WI->INFO is set to non-null when in
567 the context of a tm_safe function, and null for a __transaction block. */
569 #define DIAG_TM_OUTER 1
570 #define DIAG_TM_SAFE 2
571 #define DIAG_TM_RELAXED 4
573 struct diagnose_tm
575 unsigned int summary_flags : 8;
576 unsigned int block_flags : 8;
577 unsigned int func_flags : 8;
578 unsigned int saw_volatile : 1;
579 gimple stmt;
582 /* Return true if T is a volatile variable of some kind. */
584 static bool
585 volatile_var_p (tree t)
587 return (SSA_VAR_P (t)
588 && TREE_THIS_VOLATILE (TREE_TYPE (t)));
591 /* Tree callback function for diagnose_tm pass. */
593 static tree
594 diagnose_tm_1_op (tree *tp, int *walk_subtrees ATTRIBUTE_UNUSED,
595 void *data)
597 struct walk_stmt_info *wi = (struct walk_stmt_info *) data;
598 struct diagnose_tm *d = (struct diagnose_tm *) wi->info;
600 if (volatile_var_p (*tp)
601 && d->block_flags & DIAG_TM_SAFE
602 && !d->saw_volatile)
604 d->saw_volatile = 1;
605 error_at (gimple_location (d->stmt),
606 "invalid volatile use of %qD inside transaction",
607 *tp);
610 return NULL_TREE;
613 static inline bool
614 is_tm_safe_or_pure (const_tree x)
616 return is_tm_safe (x) || is_tm_pure (x);
619 static tree
620 diagnose_tm_1 (gimple_stmt_iterator *gsi, bool *handled_ops_p,
621 struct walk_stmt_info *wi)
623 gimple stmt = gsi_stmt (*gsi);
624 struct diagnose_tm *d = (struct diagnose_tm *) wi->info;
626 /* Save stmt for use in leaf analysis. */
627 d->stmt = stmt;
629 switch (gimple_code (stmt))
631 case GIMPLE_CALL:
633 tree fn = gimple_call_fn (stmt);
635 if ((d->summary_flags & DIAG_TM_OUTER) == 0
636 && is_tm_may_cancel_outer (fn))
637 error_at (gimple_location (stmt),
638 "%<transaction_may_cancel_outer%> function call not within"
639 " outer transaction or %<transaction_may_cancel_outer%>");
641 if (d->summary_flags & DIAG_TM_SAFE)
643 bool is_safe, direct_call_p;
644 tree replacement;
646 if (TREE_CODE (fn) == ADDR_EXPR
647 && TREE_CODE (TREE_OPERAND (fn, 0)) == FUNCTION_DECL)
649 direct_call_p = true;
650 replacement = TREE_OPERAND (fn, 0);
651 replacement = find_tm_replacement_function (replacement);
652 if (replacement)
653 fn = replacement;
655 else
657 direct_call_p = false;
658 replacement = NULL_TREE;
661 if (is_tm_safe_or_pure (fn))
662 is_safe = true;
663 else if (is_tm_callable (fn) || is_tm_irrevocable (fn))
665 /* A function explicitly marked transaction_callable as
666 opposed to transaction_safe is being defined to be
667 unsafe as part of its ABI, regardless of its contents. */
668 is_safe = false;
670 else if (direct_call_p)
672 if (IS_TYPE_OR_DECL_P (fn)
673 && flags_from_decl_or_type (fn) & ECF_TM_BUILTIN)
674 is_safe = true;
675 else if (replacement)
677 /* ??? At present we've been considering replacements
678 merely transaction_callable, and therefore might
679 enter irrevocable. The tm_wrap attribute has not
680 yet made it into the new language spec. */
681 is_safe = false;
683 else
685 /* ??? Diagnostics for unmarked direct calls moved into
686 the IPA pass. Section 3.2 of the spec details how
687 functions not marked should be considered "implicitly
688 safe" based on having examined the function body. */
689 is_safe = true;
692 else
694 /* An unmarked indirect call. Consider it unsafe even
695 though optimization may yet figure out how to inline. */
696 is_safe = false;
699 if (!is_safe)
701 if (TREE_CODE (fn) == ADDR_EXPR)
702 fn = TREE_OPERAND (fn, 0);
703 if (d->block_flags & DIAG_TM_SAFE)
705 if (direct_call_p)
706 error_at (gimple_location (stmt),
707 "unsafe function call %qD within "
708 "atomic transaction", fn);
709 else
711 if (!DECL_P (fn) || DECL_NAME (fn))
712 error_at (gimple_location (stmt),
713 "unsafe function call %qE within "
714 "atomic transaction", fn);
715 else
716 error_at (gimple_location (stmt),
717 "unsafe indirect function call within "
718 "atomic transaction");
721 else
723 if (direct_call_p)
724 error_at (gimple_location (stmt),
725 "unsafe function call %qD within "
726 "%<transaction_safe%> function", fn);
727 else
729 if (!DECL_P (fn) || DECL_NAME (fn))
730 error_at (gimple_location (stmt),
731 "unsafe function call %qE within "
732 "%<transaction_safe%> function", fn);
733 else
734 error_at (gimple_location (stmt),
735 "unsafe indirect function call within "
736 "%<transaction_safe%> function");
742 break;
744 case GIMPLE_ASM:
745 /* ??? We ought to come up with a way to add attributes to
746 asm statements, and then add "transaction_safe" to it.
747 Either that or get the language spec to resurrect __tm_waiver. */
748 if (d->block_flags & DIAG_TM_SAFE)
749 error_at (gimple_location (stmt),
750 "asm not allowed in atomic transaction");
751 else if (d->func_flags & DIAG_TM_SAFE)
752 error_at (gimple_location (stmt),
753 "asm not allowed in %<transaction_safe%> function");
754 break;
756 case GIMPLE_TRANSACTION:
758 unsigned char inner_flags = DIAG_TM_SAFE;
760 if (gimple_transaction_subcode (stmt) & GTMA_IS_RELAXED)
762 if (d->block_flags & DIAG_TM_SAFE)
763 error_at (gimple_location (stmt),
764 "relaxed transaction in atomic transaction");
765 else if (d->func_flags & DIAG_TM_SAFE)
766 error_at (gimple_location (stmt),
767 "relaxed transaction in %<transaction_safe%> function");
768 inner_flags = DIAG_TM_RELAXED;
770 else if (gimple_transaction_subcode (stmt) & GTMA_IS_OUTER)
772 if (d->block_flags)
773 error_at (gimple_location (stmt),
774 "outer transaction in transaction");
775 else if (d->func_flags & DIAG_TM_OUTER)
776 error_at (gimple_location (stmt),
777 "outer transaction in "
778 "%<transaction_may_cancel_outer%> function");
779 else if (d->func_flags & DIAG_TM_SAFE)
780 error_at (gimple_location (stmt),
781 "outer transaction in %<transaction_safe%> function");
782 inner_flags |= DIAG_TM_OUTER;
785 *handled_ops_p = true;
786 if (gimple_transaction_body (stmt))
788 struct walk_stmt_info wi_inner;
789 struct diagnose_tm d_inner;
791 memset (&d_inner, 0, sizeof (d_inner));
792 d_inner.func_flags = d->func_flags;
793 d_inner.block_flags = d->block_flags | inner_flags;
794 d_inner.summary_flags = d_inner.func_flags | d_inner.block_flags;
796 memset (&wi_inner, 0, sizeof (wi_inner));
797 wi_inner.info = &d_inner;
799 walk_gimple_seq (gimple_transaction_body (stmt),
800 diagnose_tm_1, diagnose_tm_1_op, &wi_inner);
803 break;
805 default:
806 break;
809 return NULL_TREE;
812 static unsigned int
813 diagnose_tm_blocks (void)
815 struct walk_stmt_info wi;
816 struct diagnose_tm d;
818 memset (&d, 0, sizeof (d));
819 if (is_tm_may_cancel_outer (current_function_decl))
820 d.func_flags = DIAG_TM_OUTER | DIAG_TM_SAFE;
821 else if (is_tm_safe (current_function_decl))
822 d.func_flags = DIAG_TM_SAFE;
823 d.summary_flags = d.func_flags;
825 memset (&wi, 0, sizeof (wi));
826 wi.info = &d;
828 walk_gimple_seq (gimple_body (current_function_decl),
829 diagnose_tm_1, diagnose_tm_1_op, &wi);
831 return 0;
834 namespace {
836 const pass_data pass_data_diagnose_tm_blocks =
838 GIMPLE_PASS, /* type */
839 "*diagnose_tm_blocks", /* name */
840 OPTGROUP_NONE, /* optinfo_flags */
841 true, /* has_execute */
842 TV_TRANS_MEM, /* tv_id */
843 PROP_gimple_any, /* properties_required */
844 0, /* properties_provided */
845 0, /* properties_destroyed */
846 0, /* todo_flags_start */
847 0, /* todo_flags_finish */
850 class pass_diagnose_tm_blocks : public gimple_opt_pass
852 public:
853 pass_diagnose_tm_blocks (gcc::context *ctxt)
854 : gimple_opt_pass (pass_data_diagnose_tm_blocks, ctxt)
857 /* opt_pass methods: */
858 virtual bool gate (function *) { return flag_tm; }
859 virtual unsigned int execute (function *) { return diagnose_tm_blocks (); }
861 }; // class pass_diagnose_tm_blocks
863 } // anon namespace
865 gimple_opt_pass *
866 make_pass_diagnose_tm_blocks (gcc::context *ctxt)
868 return new pass_diagnose_tm_blocks (ctxt);
871 /* Instead of instrumenting thread private memory, we save the
872 addresses in a log which we later use to save/restore the addresses
873 upon transaction start/restart.
875 The log is keyed by address, where each element contains individual
876 statements among different code paths that perform the store.
878 This log is later used to generate either plain save/restore of the
879 addresses upon transaction start/restart, or calls to the ITM_L*
880 logging functions.
882 So for something like:
884 struct large { int x[1000]; };
885 struct large lala = { 0 };
886 __transaction {
887 lala.x[i] = 123;
891 We can either save/restore:
893 lala = { 0 };
894 trxn = _ITM_startTransaction ();
895 if (trxn & a_saveLiveVariables)
896 tmp_lala1 = lala.x[i];
897 else if (a & a_restoreLiveVariables)
898 lala.x[i] = tmp_lala1;
900 or use the logging functions:
902 lala = { 0 };
903 trxn = _ITM_startTransaction ();
904 _ITM_LU4 (&lala.x[i]);
906 Obviously, if we use _ITM_L* to log, we prefer to call _ITM_L* as
907 far up the dominator tree to shadow all of the writes to a given
908 location (thus reducing the total number of logging calls), but not
909 so high as to be called on a path that does not perform a
910 write. */
912 /* One individual log entry. We may have multiple statements for the
913 same location if neither dominate each other (on different
914 execution paths). */
915 typedef struct tm_log_entry
917 /* Address to save. */
918 tree addr;
919 /* Entry block for the transaction this address occurs in. */
920 basic_block entry_block;
921 /* Dominating statements the store occurs in. */
922 gimple_vec stmts;
923 /* Initially, while we are building the log, we place a nonzero
924 value here to mean that this address *will* be saved with a
925 save/restore sequence. Later, when generating the save sequence
926 we place the SSA temp generated here. */
927 tree save_var;
928 } *tm_log_entry_t;
931 /* Log entry hashtable helpers. */
933 struct log_entry_hasher
935 typedef tm_log_entry value_type;
936 typedef tm_log_entry compare_type;
937 static inline hashval_t hash (const value_type *);
938 static inline bool equal (const value_type *, const compare_type *);
939 static inline void remove (value_type *);
942 /* Htab support. Return hash value for a `tm_log_entry'. */
943 inline hashval_t
944 log_entry_hasher::hash (const value_type *log)
946 return iterative_hash_expr (log->addr, 0);
949 /* Htab support. Return true if two log entries are the same. */
950 inline bool
951 log_entry_hasher::equal (const value_type *log1, const compare_type *log2)
953 /* FIXME:
955 rth: I suggest that we get rid of the component refs etc.
956 I.e. resolve the reference to base + offset.
958 We may need to actually finish a merge with mainline for this,
959 since we'd like to be presented with Richi's MEM_REF_EXPRs more
960 often than not. But in the meantime your tm_log_entry could save
961 the results of get_inner_reference.
963 See: g++.dg/tm/pr46653.C
966 /* Special case plain equality because operand_equal_p() below will
967 return FALSE if the addresses are equal but they have
968 side-effects (e.g. a volatile address). */
969 if (log1->addr == log2->addr)
970 return true;
972 return operand_equal_p (log1->addr, log2->addr, 0);
975 /* Htab support. Free one tm_log_entry. */
976 inline void
977 log_entry_hasher::remove (value_type *lp)
979 lp->stmts.release ();
980 free (lp);
984 /* The actual log. */
985 static hash_table <log_entry_hasher> tm_log;
987 /* Addresses to log with a save/restore sequence. These should be in
988 dominator order. */
989 static vec<tree> tm_log_save_addresses;
991 enum thread_memory_type
993 mem_non_local = 0,
994 mem_thread_local,
995 mem_transaction_local,
996 mem_max
999 typedef struct tm_new_mem_map
1001 /* SSA_NAME being dereferenced. */
1002 tree val;
1003 enum thread_memory_type local_new_memory;
1004 } tm_new_mem_map_t;
1006 /* Hashtable helpers. */
1008 struct tm_mem_map_hasher : typed_free_remove <tm_new_mem_map_t>
1010 typedef tm_new_mem_map_t value_type;
1011 typedef tm_new_mem_map_t compare_type;
1012 static inline hashval_t hash (const value_type *);
1013 static inline bool equal (const value_type *, const compare_type *);
1016 inline hashval_t
1017 tm_mem_map_hasher::hash (const value_type *v)
1019 return (intptr_t)v->val >> 4;
1022 inline bool
1023 tm_mem_map_hasher::equal (const value_type *v, const compare_type *c)
1025 return v->val == c->val;
1028 /* Map for an SSA_NAME originally pointing to a non aliased new piece
1029 of memory (malloc, alloc, etc). */
1030 static hash_table <tm_mem_map_hasher> tm_new_mem_hash;
1032 /* Initialize logging data structures. */
1033 static void
1034 tm_log_init (void)
1036 tm_log.create (10);
1037 tm_new_mem_hash.create (5);
1038 tm_log_save_addresses.create (5);
1041 /* Free logging data structures. */
1042 static void
1043 tm_log_delete (void)
1045 tm_log.dispose ();
1046 tm_new_mem_hash.dispose ();
1047 tm_log_save_addresses.release ();
1050 /* Return true if MEM is a transaction invariant memory for the TM
1051 region starting at REGION_ENTRY_BLOCK. */
1052 static bool
1053 transaction_invariant_address_p (const_tree mem, basic_block region_entry_block)
1055 if ((TREE_CODE (mem) == INDIRECT_REF || TREE_CODE (mem) == MEM_REF)
1056 && TREE_CODE (TREE_OPERAND (mem, 0)) == SSA_NAME)
1058 basic_block def_bb;
1060 def_bb = gimple_bb (SSA_NAME_DEF_STMT (TREE_OPERAND (mem, 0)));
1061 return def_bb != region_entry_block
1062 && dominated_by_p (CDI_DOMINATORS, region_entry_block, def_bb);
1065 mem = strip_invariant_refs (mem);
1066 return mem && (CONSTANT_CLASS_P (mem) || decl_address_invariant_p (mem));
1069 /* Given an address ADDR in STMT, find it in the memory log or add it,
1070 making sure to keep only the addresses highest in the dominator
1071 tree.
1073 ENTRY_BLOCK is the entry_block for the transaction.
1075 If we find the address in the log, make sure it's either the same
1076 address, or an equivalent one that dominates ADDR.
1078 If we find the address, but neither ADDR dominates the found
1079 address, nor the found one dominates ADDR, we're on different
1080 execution paths. Add it.
1082 If known, ENTRY_BLOCK is the entry block for the region, otherwise
1083 NULL. */
1084 static void
1085 tm_log_add (basic_block entry_block, tree addr, gimple stmt)
1087 tm_log_entry **slot;
1088 struct tm_log_entry l, *lp;
1090 l.addr = addr;
1091 slot = tm_log.find_slot (&l, INSERT);
1092 if (!*slot)
1094 tree type = TREE_TYPE (addr);
1096 lp = XNEW (struct tm_log_entry);
1097 lp->addr = addr;
1098 *slot = lp;
1100 /* Small invariant addresses can be handled as save/restores. */
1101 if (entry_block
1102 && transaction_invariant_address_p (lp->addr, entry_block)
1103 && TYPE_SIZE_UNIT (type) != NULL
1104 && tree_fits_uhwi_p (TYPE_SIZE_UNIT (type))
1105 && ((HOST_WIDE_INT) tree_to_uhwi (TYPE_SIZE_UNIT (type))
1106 < PARAM_VALUE (PARAM_TM_MAX_AGGREGATE_SIZE))
1107 /* We must be able to copy this type normally. I.e., no
1108 special constructors and the like. */
1109 && !TREE_ADDRESSABLE (type))
1111 lp->save_var = create_tmp_reg (TREE_TYPE (lp->addr), "tm_save");
1112 lp->stmts.create (0);
1113 lp->entry_block = entry_block;
1114 /* Save addresses separately in dominator order so we don't
1115 get confused by overlapping addresses in the save/restore
1116 sequence. */
1117 tm_log_save_addresses.safe_push (lp->addr);
1119 else
1121 /* Use the logging functions. */
1122 lp->stmts.create (5);
1123 lp->stmts.quick_push (stmt);
1124 lp->save_var = NULL;
1127 else
1129 size_t i;
1130 gimple oldstmt;
1132 lp = *slot;
1134 /* If we're generating a save/restore sequence, we don't care
1135 about statements. */
1136 if (lp->save_var)
1137 return;
1139 for (i = 0; lp->stmts.iterate (i, &oldstmt); ++i)
1141 if (stmt == oldstmt)
1142 return;
1143 /* We already have a store to the same address, higher up the
1144 dominator tree. Nothing to do. */
1145 if (dominated_by_p (CDI_DOMINATORS,
1146 gimple_bb (stmt), gimple_bb (oldstmt)))
1147 return;
1148 /* We should be processing blocks in dominator tree order. */
1149 gcc_assert (!dominated_by_p (CDI_DOMINATORS,
1150 gimple_bb (oldstmt), gimple_bb (stmt)));
1152 /* Store is on a different code path. */
1153 lp->stmts.safe_push (stmt);
1157 /* Gimplify the address of a TARGET_MEM_REF. Return the SSA_NAME
1158 result, insert the new statements before GSI. */
1160 static tree
1161 gimplify_addr (gimple_stmt_iterator *gsi, tree x)
1163 if (TREE_CODE (x) == TARGET_MEM_REF)
1164 x = tree_mem_ref_addr (build_pointer_type (TREE_TYPE (x)), x);
1165 else
1166 x = build_fold_addr_expr (x);
1167 return force_gimple_operand_gsi (gsi, x, true, NULL, true, GSI_SAME_STMT);
1170 /* Instrument one address with the logging functions.
1171 ADDR is the address to save.
1172 STMT is the statement before which to place it. */
1173 static void
1174 tm_log_emit_stmt (tree addr, gimple stmt)
1176 tree type = TREE_TYPE (addr);
1177 tree size = TYPE_SIZE_UNIT (type);
1178 gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
1179 gimple log;
1180 enum built_in_function code = BUILT_IN_TM_LOG;
1182 if (type == float_type_node)
1183 code = BUILT_IN_TM_LOG_FLOAT;
1184 else if (type == double_type_node)
1185 code = BUILT_IN_TM_LOG_DOUBLE;
1186 else if (type == long_double_type_node)
1187 code = BUILT_IN_TM_LOG_LDOUBLE;
1188 else if (tree_fits_uhwi_p (size))
1190 unsigned int n = tree_to_uhwi (size);
1191 switch (n)
1193 case 1:
1194 code = BUILT_IN_TM_LOG_1;
1195 break;
1196 case 2:
1197 code = BUILT_IN_TM_LOG_2;
1198 break;
1199 case 4:
1200 code = BUILT_IN_TM_LOG_4;
1201 break;
1202 case 8:
1203 code = BUILT_IN_TM_LOG_8;
1204 break;
1205 default:
1206 code = BUILT_IN_TM_LOG;
1207 if (TREE_CODE (type) == VECTOR_TYPE)
1209 if (n == 8 && builtin_decl_explicit (BUILT_IN_TM_LOG_M64))
1210 code = BUILT_IN_TM_LOG_M64;
1211 else if (n == 16 && builtin_decl_explicit (BUILT_IN_TM_LOG_M128))
1212 code = BUILT_IN_TM_LOG_M128;
1213 else if (n == 32 && builtin_decl_explicit (BUILT_IN_TM_LOG_M256))
1214 code = BUILT_IN_TM_LOG_M256;
1216 break;
1220 addr = gimplify_addr (&gsi, addr);
1221 if (code == BUILT_IN_TM_LOG)
1222 log = gimple_build_call (builtin_decl_explicit (code), 2, addr, size);
1223 else
1224 log = gimple_build_call (builtin_decl_explicit (code), 1, addr);
1225 gsi_insert_before (&gsi, log, GSI_SAME_STMT);
1228 /* Go through the log and instrument address that must be instrumented
1229 with the logging functions. Leave the save/restore addresses for
1230 later. */
1231 static void
1232 tm_log_emit (void)
1234 hash_table <log_entry_hasher>::iterator hi;
1235 struct tm_log_entry *lp;
1237 FOR_EACH_HASH_TABLE_ELEMENT (tm_log, lp, tm_log_entry_t, hi)
1239 size_t i;
1240 gimple stmt;
1242 if (dump_file)
1244 fprintf (dump_file, "TM thread private mem logging: ");
1245 print_generic_expr (dump_file, lp->addr, 0);
1246 fprintf (dump_file, "\n");
1249 if (lp->save_var)
1251 if (dump_file)
1252 fprintf (dump_file, "DUMPING to variable\n");
1253 continue;
1255 else
1257 if (dump_file)
1258 fprintf (dump_file, "DUMPING with logging functions\n");
1259 for (i = 0; lp->stmts.iterate (i, &stmt); ++i)
1260 tm_log_emit_stmt (lp->addr, stmt);
1265 /* Emit the save sequence for the corresponding addresses in the log.
1266 ENTRY_BLOCK is the entry block for the transaction.
1267 BB is the basic block to insert the code in. */
1268 static void
1269 tm_log_emit_saves (basic_block entry_block, basic_block bb)
1271 size_t i;
1272 gimple_stmt_iterator gsi = gsi_last_bb (bb);
1273 gimple stmt;
1274 struct tm_log_entry l, *lp;
1276 for (i = 0; i < tm_log_save_addresses.length (); ++i)
1278 l.addr = tm_log_save_addresses[i];
1279 lp = *(tm_log.find_slot (&l, NO_INSERT));
1280 gcc_assert (lp->save_var != NULL);
1282 /* We only care about variables in the current transaction. */
1283 if (lp->entry_block != entry_block)
1284 continue;
1286 stmt = gimple_build_assign (lp->save_var, unshare_expr (lp->addr));
1288 /* Make sure we can create an SSA_NAME for this type. For
1289 instance, aggregates aren't allowed, in which case the system
1290 will create a VOP for us and everything will just work. */
1291 if (is_gimple_reg_type (TREE_TYPE (lp->save_var)))
1293 lp->save_var = make_ssa_name (lp->save_var, stmt);
1294 gimple_assign_set_lhs (stmt, lp->save_var);
1297 gsi_insert_before (&gsi, stmt, GSI_SAME_STMT);
1301 /* Emit the restore sequence for the corresponding addresses in the log.
1302 ENTRY_BLOCK is the entry block for the transaction.
1303 BB is the basic block to insert the code in. */
1304 static void
1305 tm_log_emit_restores (basic_block entry_block, basic_block bb)
1307 int i;
1308 struct tm_log_entry l, *lp;
1309 gimple_stmt_iterator gsi;
1310 gimple stmt;
1312 for (i = tm_log_save_addresses.length () - 1; i >= 0; i--)
1314 l.addr = tm_log_save_addresses[i];
1315 lp = *(tm_log.find_slot (&l, NO_INSERT));
1316 gcc_assert (lp->save_var != NULL);
1318 /* We only care about variables in the current transaction. */
1319 if (lp->entry_block != entry_block)
1320 continue;
1322 /* Restores are in LIFO order from the saves in case we have
1323 overlaps. */
1324 gsi = gsi_start_bb (bb);
1326 stmt = gimple_build_assign (unshare_expr (lp->addr), lp->save_var);
1327 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
1332 static tree lower_sequence_tm (gimple_stmt_iterator *, bool *,
1333 struct walk_stmt_info *);
1334 static tree lower_sequence_no_tm (gimple_stmt_iterator *, bool *,
1335 struct walk_stmt_info *);
1337 /* Evaluate an address X being dereferenced and determine if it
1338 originally points to a non aliased new chunk of memory (malloc,
1339 alloca, etc).
1341 Return MEM_THREAD_LOCAL if it points to a thread-local address.
1342 Return MEM_TRANSACTION_LOCAL if it points to a transaction-local address.
1343 Return MEM_NON_LOCAL otherwise.
1345 ENTRY_BLOCK is the entry block to the transaction containing the
1346 dereference of X. */
1347 static enum thread_memory_type
1348 thread_private_new_memory (basic_block entry_block, tree x)
1350 gimple stmt = NULL;
1351 enum tree_code code;
1352 tm_new_mem_map_t **slot;
1353 tm_new_mem_map_t elt, *elt_p;
1354 tree val = x;
1355 enum thread_memory_type retval = mem_transaction_local;
1357 if (!entry_block
1358 || TREE_CODE (x) != SSA_NAME
1359 /* Possible uninitialized use, or a function argument. In
1360 either case, we don't care. */
1361 || SSA_NAME_IS_DEFAULT_DEF (x))
1362 return mem_non_local;
1364 /* Look in cache first. */
1365 elt.val = x;
1366 slot = tm_new_mem_hash.find_slot (&elt, INSERT);
1367 elt_p = *slot;
1368 if (elt_p)
1369 return elt_p->local_new_memory;
1371 /* Optimistically assume the memory is transaction local during
1372 processing. This catches recursion into this variable. */
1373 *slot = elt_p = XNEW (tm_new_mem_map_t);
1374 elt_p->val = val;
1375 elt_p->local_new_memory = mem_transaction_local;
1377 /* Search DEF chain to find the original definition of this address. */
1380 if (ptr_deref_may_alias_global_p (x))
1382 /* Address escapes. This is not thread-private. */
1383 retval = mem_non_local;
1384 goto new_memory_ret;
1387 stmt = SSA_NAME_DEF_STMT (x);
1389 /* If the malloc call is outside the transaction, this is
1390 thread-local. */
1391 if (retval != mem_thread_local
1392 && !dominated_by_p (CDI_DOMINATORS, gimple_bb (stmt), entry_block))
1393 retval = mem_thread_local;
1395 if (is_gimple_assign (stmt))
1397 code = gimple_assign_rhs_code (stmt);
1398 /* x = foo ==> foo */
1399 if (code == SSA_NAME)
1400 x = gimple_assign_rhs1 (stmt);
1401 /* x = foo + n ==> foo */
1402 else if (code == POINTER_PLUS_EXPR)
1403 x = gimple_assign_rhs1 (stmt);
1404 /* x = (cast*) foo ==> foo */
1405 else if (code == VIEW_CONVERT_EXPR || code == NOP_EXPR)
1406 x = gimple_assign_rhs1 (stmt);
1407 /* x = c ? op1 : op2 == > op1 or op2 just like a PHI */
1408 else if (code == COND_EXPR)
1410 tree op1 = gimple_assign_rhs2 (stmt);
1411 tree op2 = gimple_assign_rhs3 (stmt);
1412 enum thread_memory_type mem;
1413 retval = thread_private_new_memory (entry_block, op1);
1414 if (retval == mem_non_local)
1415 goto new_memory_ret;
1416 mem = thread_private_new_memory (entry_block, op2);
1417 retval = MIN (retval, mem);
1418 goto new_memory_ret;
1420 else
1422 retval = mem_non_local;
1423 goto new_memory_ret;
1426 else
1428 if (gimple_code (stmt) == GIMPLE_PHI)
1430 unsigned int i;
1431 enum thread_memory_type mem;
1432 tree phi_result = gimple_phi_result (stmt);
1434 /* If any of the ancestors are non-local, we are sure to
1435 be non-local. Otherwise we can avoid doing anything
1436 and inherit what has already been generated. */
1437 retval = mem_max;
1438 for (i = 0; i < gimple_phi_num_args (stmt); ++i)
1440 tree op = PHI_ARG_DEF (stmt, i);
1442 /* Exclude self-assignment. */
1443 if (phi_result == op)
1444 continue;
1446 mem = thread_private_new_memory (entry_block, op);
1447 if (mem == mem_non_local)
1449 retval = mem;
1450 goto new_memory_ret;
1452 retval = MIN (retval, mem);
1454 goto new_memory_ret;
1456 break;
1459 while (TREE_CODE (x) == SSA_NAME);
1461 if (stmt && is_gimple_call (stmt) && gimple_call_flags (stmt) & ECF_MALLOC)
1462 /* Thread-local or transaction-local. */
1464 else
1465 retval = mem_non_local;
1467 new_memory_ret:
1468 elt_p->local_new_memory = retval;
1469 return retval;
1472 /* Determine whether X has to be instrumented using a read
1473 or write barrier.
1475 ENTRY_BLOCK is the entry block for the region where stmt resides
1476 in. NULL if unknown.
1478 STMT is the statement in which X occurs in. It is used for thread
1479 private memory instrumentation. If no TPM instrumentation is
1480 desired, STMT should be null. */
1481 static bool
1482 requires_barrier (basic_block entry_block, tree x, gimple stmt)
1484 tree orig = x;
1485 while (handled_component_p (x))
1486 x = TREE_OPERAND (x, 0);
1488 switch (TREE_CODE (x))
1490 case INDIRECT_REF:
1491 case MEM_REF:
1493 enum thread_memory_type ret;
1495 ret = thread_private_new_memory (entry_block, TREE_OPERAND (x, 0));
1496 if (ret == mem_non_local)
1497 return true;
1498 if (stmt && ret == mem_thread_local)
1499 /* ?? Should we pass `orig', or the INDIRECT_REF X. ?? */
1500 tm_log_add (entry_block, orig, stmt);
1502 /* Transaction-locals require nothing at all. For malloc, a
1503 transaction restart frees the memory and we reallocate.
1504 For alloca, the stack pointer gets reset by the retry and
1505 we reallocate. */
1506 return false;
1509 case TARGET_MEM_REF:
1510 if (TREE_CODE (TMR_BASE (x)) != ADDR_EXPR)
1511 return true;
1512 x = TREE_OPERAND (TMR_BASE (x), 0);
1513 if (TREE_CODE (x) == PARM_DECL)
1514 return false;
1515 gcc_assert (TREE_CODE (x) == VAR_DECL);
1516 /* FALLTHRU */
1518 case PARM_DECL:
1519 case RESULT_DECL:
1520 case VAR_DECL:
1521 if (DECL_BY_REFERENCE (x))
1523 /* ??? This value is a pointer, but aggregate_value_p has been
1524 jigged to return true which confuses needs_to_live_in_memory.
1525 This ought to be cleaned up generically.
1527 FIXME: Verify this still happens after the next mainline
1528 merge. Testcase ie g++.dg/tm/pr47554.C.
1530 return false;
1533 if (is_global_var (x))
1534 return !TREE_READONLY (x);
1535 if (/* FIXME: This condition should actually go below in the
1536 tm_log_add() call, however is_call_clobbered() depends on
1537 aliasing info which is not available during
1538 gimplification. Since requires_barrier() gets called
1539 during lower_sequence_tm/gimplification, leave the call
1540 to needs_to_live_in_memory until we eliminate
1541 lower_sequence_tm altogether. */
1542 needs_to_live_in_memory (x))
1543 return true;
1544 else
1546 /* For local memory that doesn't escape (aka thread private
1547 memory), we can either save the value at the beginning of
1548 the transaction and restore on restart, or call a tm
1549 function to dynamically save and restore on restart
1550 (ITM_L*). */
1551 if (stmt)
1552 tm_log_add (entry_block, orig, stmt);
1553 return false;
1556 default:
1557 return false;
1561 /* Mark the GIMPLE_ASSIGN statement as appropriate for being inside
1562 a transaction region. */
1564 static void
1565 examine_assign_tm (unsigned *state, gimple_stmt_iterator *gsi)
1567 gimple stmt = gsi_stmt (*gsi);
1569 if (requires_barrier (/*entry_block=*/NULL, gimple_assign_rhs1 (stmt), NULL))
1570 *state |= GTMA_HAVE_LOAD;
1571 if (requires_barrier (/*entry_block=*/NULL, gimple_assign_lhs (stmt), NULL))
1572 *state |= GTMA_HAVE_STORE;
1575 /* Mark a GIMPLE_CALL as appropriate for being inside a transaction. */
1577 static void
1578 examine_call_tm (unsigned *state, gimple_stmt_iterator *gsi)
1580 gimple stmt = gsi_stmt (*gsi);
1581 tree fn;
1583 if (is_tm_pure_call (stmt))
1584 return;
1586 /* Check if this call is a transaction abort. */
1587 fn = gimple_call_fndecl (stmt);
1588 if (is_tm_abort (fn))
1589 *state |= GTMA_HAVE_ABORT;
1591 /* Note that something may happen. */
1592 *state |= GTMA_HAVE_LOAD | GTMA_HAVE_STORE;
1595 /* Lower a GIMPLE_TRANSACTION statement. */
1597 static void
1598 lower_transaction (gimple_stmt_iterator *gsi, struct walk_stmt_info *wi)
1600 gimple g, stmt = gsi_stmt (*gsi);
1601 unsigned int *outer_state = (unsigned int *) wi->info;
1602 unsigned int this_state = 0;
1603 struct walk_stmt_info this_wi;
1605 /* First, lower the body. The scanning that we do inside gives
1606 us some idea of what we're dealing with. */
1607 memset (&this_wi, 0, sizeof (this_wi));
1608 this_wi.info = (void *) &this_state;
1609 walk_gimple_seq_mod (gimple_transaction_body_ptr (stmt),
1610 lower_sequence_tm, NULL, &this_wi);
1612 /* If there was absolutely nothing transaction related inside the
1613 transaction, we may elide it. Likewise if this is a nested
1614 transaction and does not contain an abort. */
1615 if (this_state == 0
1616 || (!(this_state & GTMA_HAVE_ABORT) && outer_state != NULL))
1618 if (outer_state)
1619 *outer_state |= this_state;
1621 gsi_insert_seq_before (gsi, gimple_transaction_body (stmt),
1622 GSI_SAME_STMT);
1623 gimple_transaction_set_body (stmt, NULL);
1625 gsi_remove (gsi, true);
1626 wi->removed_stmt = true;
1627 return;
1630 /* Wrap the body of the transaction in a try-finally node so that
1631 the commit call is always properly called. */
1632 g = gimple_build_call (builtin_decl_explicit (BUILT_IN_TM_COMMIT), 0);
1633 if (flag_exceptions)
1635 tree ptr;
1636 gimple_seq n_seq, e_seq;
1638 n_seq = gimple_seq_alloc_with_stmt (g);
1639 e_seq = NULL;
1641 g = gimple_build_call (builtin_decl_explicit (BUILT_IN_EH_POINTER),
1642 1, integer_zero_node);
1643 ptr = create_tmp_var (ptr_type_node, NULL);
1644 gimple_call_set_lhs (g, ptr);
1645 gimple_seq_add_stmt (&e_seq, g);
1647 g = gimple_build_call (builtin_decl_explicit (BUILT_IN_TM_COMMIT_EH),
1648 1, ptr);
1649 gimple_seq_add_stmt (&e_seq, g);
1651 g = gimple_build_eh_else (n_seq, e_seq);
1654 g = gimple_build_try (gimple_transaction_body (stmt),
1655 gimple_seq_alloc_with_stmt (g), GIMPLE_TRY_FINALLY);
1656 gsi_insert_after (gsi, g, GSI_CONTINUE_LINKING);
1658 gimple_transaction_set_body (stmt, NULL);
1660 /* If the transaction calls abort or if this is an outer transaction,
1661 add an "over" label afterwards. */
1662 if ((this_state & (GTMA_HAVE_ABORT))
1663 || (gimple_transaction_subcode (stmt) & GTMA_IS_OUTER))
1665 tree label = create_artificial_label (UNKNOWN_LOCATION);
1666 gimple_transaction_set_label (stmt, label);
1667 gsi_insert_after (gsi, gimple_build_label (label), GSI_CONTINUE_LINKING);
1670 /* Record the set of operations found for use later. */
1671 this_state |= gimple_transaction_subcode (stmt) & GTMA_DECLARATION_MASK;
1672 gimple_transaction_set_subcode (stmt, this_state);
1675 /* Iterate through the statements in the sequence, lowering them all
1676 as appropriate for being in a transaction. */
1678 static tree
1679 lower_sequence_tm (gimple_stmt_iterator *gsi, bool *handled_ops_p,
1680 struct walk_stmt_info *wi)
1682 unsigned int *state = (unsigned int *) wi->info;
1683 gimple stmt = gsi_stmt (*gsi);
1685 *handled_ops_p = true;
1686 switch (gimple_code (stmt))
1688 case GIMPLE_ASSIGN:
1689 /* Only memory reads/writes need to be instrumented. */
1690 if (gimple_assign_single_p (stmt))
1691 examine_assign_tm (state, gsi);
1692 break;
1694 case GIMPLE_CALL:
1695 examine_call_tm (state, gsi);
1696 break;
1698 case GIMPLE_ASM:
1699 *state |= GTMA_MAY_ENTER_IRREVOCABLE;
1700 break;
1702 case GIMPLE_TRANSACTION:
1703 lower_transaction (gsi, wi);
1704 break;
1706 default:
1707 *handled_ops_p = !gimple_has_substatements (stmt);
1708 break;
1711 return NULL_TREE;
1714 /* Iterate through the statements in the sequence, lowering them all
1715 as appropriate for being outside of a transaction. */
1717 static tree
1718 lower_sequence_no_tm (gimple_stmt_iterator *gsi, bool *handled_ops_p,
1719 struct walk_stmt_info * wi)
1721 gimple stmt = gsi_stmt (*gsi);
1723 if (gimple_code (stmt) == GIMPLE_TRANSACTION)
1725 *handled_ops_p = true;
1726 lower_transaction (gsi, wi);
1728 else
1729 *handled_ops_p = !gimple_has_substatements (stmt);
1731 return NULL_TREE;
1734 /* Main entry point for flattening GIMPLE_TRANSACTION constructs. After
1735 this, GIMPLE_TRANSACTION nodes still exist, but the nested body has
1736 been moved out, and all the data required for constructing a proper
1737 CFG has been recorded. */
1739 static unsigned int
1740 execute_lower_tm (void)
1742 struct walk_stmt_info wi;
1743 gimple_seq body;
1745 /* Transactional clones aren't created until a later pass. */
1746 gcc_assert (!decl_is_tm_clone (current_function_decl));
1748 body = gimple_body (current_function_decl);
1749 memset (&wi, 0, sizeof (wi));
1750 walk_gimple_seq_mod (&body, lower_sequence_no_tm, NULL, &wi);
1751 gimple_set_body (current_function_decl, body);
1753 return 0;
1756 namespace {
1758 const pass_data pass_data_lower_tm =
1760 GIMPLE_PASS, /* type */
1761 "tmlower", /* name */
1762 OPTGROUP_NONE, /* optinfo_flags */
1763 true, /* has_execute */
1764 TV_TRANS_MEM, /* tv_id */
1765 PROP_gimple_lcf, /* properties_required */
1766 0, /* properties_provided */
1767 0, /* properties_destroyed */
1768 0, /* todo_flags_start */
1769 0, /* todo_flags_finish */
1772 class pass_lower_tm : public gimple_opt_pass
1774 public:
1775 pass_lower_tm (gcc::context *ctxt)
1776 : gimple_opt_pass (pass_data_lower_tm, ctxt)
1779 /* opt_pass methods: */
1780 virtual bool gate (function *) { return flag_tm; }
1781 virtual unsigned int execute (function *) { return execute_lower_tm (); }
1783 }; // class pass_lower_tm
1785 } // anon namespace
1787 gimple_opt_pass *
1788 make_pass_lower_tm (gcc::context *ctxt)
1790 return new pass_lower_tm (ctxt);
1793 /* Collect region information for each transaction. */
1795 struct tm_region
1797 /* Link to the next unnested transaction. */
1798 struct tm_region *next;
1800 /* Link to the next inner transaction. */
1801 struct tm_region *inner;
1803 /* Link to the next outer transaction. */
1804 struct tm_region *outer;
1806 /* The GIMPLE_TRANSACTION statement beginning this transaction.
1807 After TM_MARK, this gets replaced by a call to
1808 BUILT_IN_TM_START. */
1809 gimple transaction_stmt;
1811 /* After TM_MARK expands the GIMPLE_TRANSACTION into a call to
1812 BUILT_IN_TM_START, this field is true if the transaction is an
1813 outer transaction. */
1814 bool original_transaction_was_outer;
1816 /* Return value from BUILT_IN_TM_START. */
1817 tree tm_state;
1819 /* The entry block to this region. This will always be the first
1820 block of the body of the transaction. */
1821 basic_block entry_block;
1823 /* The first block after an expanded call to _ITM_beginTransaction. */
1824 basic_block restart_block;
1826 /* The set of all blocks that end the region; NULL if only EXIT_BLOCK.
1827 These blocks are still a part of the region (i.e., the border is
1828 inclusive). Note that this set is only complete for paths in the CFG
1829 starting at ENTRY_BLOCK, and that there is no exit block recorded for
1830 the edge to the "over" label. */
1831 bitmap exit_blocks;
1833 /* The set of all blocks that have an TM_IRREVOCABLE call. */
1834 bitmap irr_blocks;
1837 typedef struct tm_region *tm_region_p;
1839 /* True if there are pending edge statements to be committed for the
1840 current function being scanned in the tmmark pass. */
1841 bool pending_edge_inserts_p;
1843 static struct tm_region *all_tm_regions;
1844 static bitmap_obstack tm_obstack;
1847 /* A subroutine of tm_region_init. Record the existence of the
1848 GIMPLE_TRANSACTION statement in a tree of tm_region elements. */
1850 static struct tm_region *
1851 tm_region_init_0 (struct tm_region *outer, basic_block bb, gimple stmt)
1853 struct tm_region *region;
1855 region = (struct tm_region *)
1856 obstack_alloc (&tm_obstack.obstack, sizeof (struct tm_region));
1858 if (outer)
1860 region->next = outer->inner;
1861 outer->inner = region;
1863 else
1865 region->next = all_tm_regions;
1866 all_tm_regions = region;
1868 region->inner = NULL;
1869 region->outer = outer;
1871 region->transaction_stmt = stmt;
1872 region->original_transaction_was_outer = false;
1873 region->tm_state = NULL;
1875 /* There are either one or two edges out of the block containing
1876 the GIMPLE_TRANSACTION, one to the actual region and one to the
1877 "over" label if the region contains an abort. The former will
1878 always be the one marked FALLTHRU. */
1879 region->entry_block = FALLTHRU_EDGE (bb)->dest;
1881 region->exit_blocks = BITMAP_ALLOC (&tm_obstack);
1882 region->irr_blocks = BITMAP_ALLOC (&tm_obstack);
1884 return region;
1887 /* A subroutine of tm_region_init. Record all the exit and
1888 irrevocable blocks in BB into the region's exit_blocks and
1889 irr_blocks bitmaps. Returns the new region being scanned. */
1891 static struct tm_region *
1892 tm_region_init_1 (struct tm_region *region, basic_block bb)
1894 gimple_stmt_iterator gsi;
1895 gimple g;
1897 if (!region
1898 || (!region->irr_blocks && !region->exit_blocks))
1899 return region;
1901 /* Check to see if this is the end of a region by seeing if it
1902 contains a call to __builtin_tm_commit{,_eh}. Note that the
1903 outermost region for DECL_IS_TM_CLONE need not collect this. */
1904 for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi); gsi_prev (&gsi))
1906 g = gsi_stmt (gsi);
1907 if (gimple_code (g) == GIMPLE_CALL)
1909 tree fn = gimple_call_fndecl (g);
1910 if (fn && DECL_BUILT_IN_CLASS (fn) == BUILT_IN_NORMAL)
1912 if ((DECL_FUNCTION_CODE (fn) == BUILT_IN_TM_COMMIT
1913 || DECL_FUNCTION_CODE (fn) == BUILT_IN_TM_COMMIT_EH)
1914 && region->exit_blocks)
1916 bitmap_set_bit (region->exit_blocks, bb->index);
1917 region = region->outer;
1918 break;
1920 if (DECL_FUNCTION_CODE (fn) == BUILT_IN_TM_IRREVOCABLE)
1921 bitmap_set_bit (region->irr_blocks, bb->index);
1925 return region;
1928 /* Collect all of the transaction regions within the current function
1929 and record them in ALL_TM_REGIONS. The REGION parameter may specify
1930 an "outermost" region for use by tm clones. */
1932 static void
1933 tm_region_init (struct tm_region *region)
1935 gimple g;
1936 edge_iterator ei;
1937 edge e;
1938 basic_block bb;
1939 auto_vec<basic_block> queue;
1940 bitmap visited_blocks = BITMAP_ALLOC (NULL);
1941 struct tm_region *old_region;
1942 auto_vec<tm_region_p> bb_regions;
1944 all_tm_regions = region;
1945 bb = single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun));
1947 /* We could store this information in bb->aux, but we may get called
1948 through get_all_tm_blocks() from another pass that may be already
1949 using bb->aux. */
1950 bb_regions.safe_grow_cleared (last_basic_block_for_fn (cfun));
1952 queue.safe_push (bb);
1953 bb_regions[bb->index] = region;
1956 bb = queue.pop ();
1957 region = bb_regions[bb->index];
1958 bb_regions[bb->index] = NULL;
1960 /* Record exit and irrevocable blocks. */
1961 region = tm_region_init_1 (region, bb);
1963 /* Check for the last statement in the block beginning a new region. */
1964 g = last_stmt (bb);
1965 old_region = region;
1966 if (g && gimple_code (g) == GIMPLE_TRANSACTION)
1967 region = tm_region_init_0 (region, bb, g);
1969 /* Process subsequent blocks. */
1970 FOR_EACH_EDGE (e, ei, bb->succs)
1971 if (!bitmap_bit_p (visited_blocks, e->dest->index))
1973 bitmap_set_bit (visited_blocks, e->dest->index);
1974 queue.safe_push (e->dest);
1976 /* If the current block started a new region, make sure that only
1977 the entry block of the new region is associated with this region.
1978 Other successors are still part of the old region. */
1979 if (old_region != region && e->dest != region->entry_block)
1980 bb_regions[e->dest->index] = old_region;
1981 else
1982 bb_regions[e->dest->index] = region;
1985 while (!queue.is_empty ());
1986 BITMAP_FREE (visited_blocks);
1989 /* The "gate" function for all transactional memory expansion and optimization
1990 passes. We collect region information for each top-level transaction, and
1991 if we don't find any, we skip all of the TM passes. Each region will have
1992 all of the exit blocks recorded, and the originating statement. */
1994 static bool
1995 gate_tm_init (void)
1997 if (!flag_tm)
1998 return false;
2000 calculate_dominance_info (CDI_DOMINATORS);
2001 bitmap_obstack_initialize (&tm_obstack);
2003 /* If the function is a TM_CLONE, then the entire function is the region. */
2004 if (decl_is_tm_clone (current_function_decl))
2006 struct tm_region *region = (struct tm_region *)
2007 obstack_alloc (&tm_obstack.obstack, sizeof (struct tm_region));
2008 memset (region, 0, sizeof (*region));
2009 region->entry_block = single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun));
2010 /* For a clone, the entire function is the region. But even if
2011 we don't need to record any exit blocks, we may need to
2012 record irrevocable blocks. */
2013 region->irr_blocks = BITMAP_ALLOC (&tm_obstack);
2015 tm_region_init (region);
2017 else
2019 tm_region_init (NULL);
2021 /* If we didn't find any regions, cleanup and skip the whole tree
2022 of tm-related optimizations. */
2023 if (all_tm_regions == NULL)
2025 bitmap_obstack_release (&tm_obstack);
2026 return false;
2030 return true;
2033 namespace {
2035 const pass_data pass_data_tm_init =
2037 GIMPLE_PASS, /* type */
2038 "*tminit", /* name */
2039 OPTGROUP_NONE, /* optinfo_flags */
2040 false, /* has_execute */
2041 TV_TRANS_MEM, /* tv_id */
2042 ( PROP_ssa | PROP_cfg ), /* properties_required */
2043 0, /* properties_provided */
2044 0, /* properties_destroyed */
2045 0, /* todo_flags_start */
2046 0, /* todo_flags_finish */
2049 class pass_tm_init : public gimple_opt_pass
2051 public:
2052 pass_tm_init (gcc::context *ctxt)
2053 : gimple_opt_pass (pass_data_tm_init, ctxt)
2056 /* opt_pass methods: */
2057 virtual bool gate (function *) { return gate_tm_init (); }
2059 }; // class pass_tm_init
2061 } // anon namespace
2063 gimple_opt_pass *
2064 make_pass_tm_init (gcc::context *ctxt)
2066 return new pass_tm_init (ctxt);
2069 /* Add FLAGS to the GIMPLE_TRANSACTION subcode for the transaction region
2070 represented by STATE. */
2072 static inline void
2073 transaction_subcode_ior (struct tm_region *region, unsigned flags)
2075 if (region && region->transaction_stmt)
2077 flags |= gimple_transaction_subcode (region->transaction_stmt);
2078 gimple_transaction_set_subcode (region->transaction_stmt, flags);
2082 /* Construct a memory load in a transactional context. Return the
2083 gimple statement performing the load, or NULL if there is no
2084 TM_LOAD builtin of the appropriate size to do the load.
2086 LOC is the location to use for the new statement(s). */
2088 static gimple
2089 build_tm_load (location_t loc, tree lhs, tree rhs, gimple_stmt_iterator *gsi)
2091 enum built_in_function code = END_BUILTINS;
2092 tree t, type = TREE_TYPE (rhs), decl;
2093 gimple gcall;
2095 if (type == float_type_node)
2096 code = BUILT_IN_TM_LOAD_FLOAT;
2097 else if (type == double_type_node)
2098 code = BUILT_IN_TM_LOAD_DOUBLE;
2099 else if (type == long_double_type_node)
2100 code = BUILT_IN_TM_LOAD_LDOUBLE;
2101 else if (TYPE_SIZE_UNIT (type) != NULL
2102 && tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
2104 switch (tree_to_uhwi (TYPE_SIZE_UNIT (type)))
2106 case 1:
2107 code = BUILT_IN_TM_LOAD_1;
2108 break;
2109 case 2:
2110 code = BUILT_IN_TM_LOAD_2;
2111 break;
2112 case 4:
2113 code = BUILT_IN_TM_LOAD_4;
2114 break;
2115 case 8:
2116 code = BUILT_IN_TM_LOAD_8;
2117 break;
2121 if (code == END_BUILTINS)
2123 decl = targetm.vectorize.builtin_tm_load (type);
2124 if (!decl)
2125 return NULL;
2127 else
2128 decl = builtin_decl_explicit (code);
2130 t = gimplify_addr (gsi, rhs);
2131 gcall = gimple_build_call (decl, 1, t);
2132 gimple_set_location (gcall, loc);
2134 t = TREE_TYPE (TREE_TYPE (decl));
2135 if (useless_type_conversion_p (type, t))
2137 gimple_call_set_lhs (gcall, lhs);
2138 gsi_insert_before (gsi, gcall, GSI_SAME_STMT);
2140 else
2142 gimple g;
2143 tree temp;
2145 temp = create_tmp_reg (t, NULL);
2146 gimple_call_set_lhs (gcall, temp);
2147 gsi_insert_before (gsi, gcall, GSI_SAME_STMT);
2149 t = fold_build1 (VIEW_CONVERT_EXPR, type, temp);
2150 g = gimple_build_assign (lhs, t);
2151 gsi_insert_before (gsi, g, GSI_SAME_STMT);
2154 return gcall;
2158 /* Similarly for storing TYPE in a transactional context. */
2160 static gimple
2161 build_tm_store (location_t loc, tree lhs, tree rhs, gimple_stmt_iterator *gsi)
2163 enum built_in_function code = END_BUILTINS;
2164 tree t, fn, type = TREE_TYPE (rhs), simple_type;
2165 gimple gcall;
2167 if (type == float_type_node)
2168 code = BUILT_IN_TM_STORE_FLOAT;
2169 else if (type == double_type_node)
2170 code = BUILT_IN_TM_STORE_DOUBLE;
2171 else if (type == long_double_type_node)
2172 code = BUILT_IN_TM_STORE_LDOUBLE;
2173 else if (TYPE_SIZE_UNIT (type) != NULL
2174 && tree_fits_uhwi_p (TYPE_SIZE_UNIT (type)))
2176 switch (tree_to_uhwi (TYPE_SIZE_UNIT (type)))
2178 case 1:
2179 code = BUILT_IN_TM_STORE_1;
2180 break;
2181 case 2:
2182 code = BUILT_IN_TM_STORE_2;
2183 break;
2184 case 4:
2185 code = BUILT_IN_TM_STORE_4;
2186 break;
2187 case 8:
2188 code = BUILT_IN_TM_STORE_8;
2189 break;
2193 if (code == END_BUILTINS)
2195 fn = targetm.vectorize.builtin_tm_store (type);
2196 if (!fn)
2197 return NULL;
2199 else
2200 fn = builtin_decl_explicit (code);
2202 simple_type = TREE_VALUE (TREE_CHAIN (TYPE_ARG_TYPES (TREE_TYPE (fn))));
2204 if (TREE_CODE (rhs) == CONSTRUCTOR)
2206 /* Handle the easy initialization to zero. */
2207 if (!CONSTRUCTOR_ELTS (rhs))
2208 rhs = build_int_cst (simple_type, 0);
2209 else
2211 /* ...otherwise punt to the caller and probably use
2212 BUILT_IN_TM_MEMMOVE, because we can't wrap a
2213 VIEW_CONVERT_EXPR around a CONSTRUCTOR (below) and produce
2214 valid gimple. */
2215 return NULL;
2218 else if (!useless_type_conversion_p (simple_type, type))
2220 gimple g;
2221 tree temp;
2223 temp = create_tmp_reg (simple_type, NULL);
2224 t = fold_build1 (VIEW_CONVERT_EXPR, simple_type, rhs);
2225 g = gimple_build_assign (temp, t);
2226 gimple_set_location (g, loc);
2227 gsi_insert_before (gsi, g, GSI_SAME_STMT);
2229 rhs = temp;
2232 t = gimplify_addr (gsi, lhs);
2233 gcall = gimple_build_call (fn, 2, t, rhs);
2234 gimple_set_location (gcall, loc);
2235 gsi_insert_before (gsi, gcall, GSI_SAME_STMT);
2237 return gcall;
2241 /* Expand an assignment statement into transactional builtins. */
2243 static void
2244 expand_assign_tm (struct tm_region *region, gimple_stmt_iterator *gsi)
2246 gimple stmt = gsi_stmt (*gsi);
2247 location_t loc = gimple_location (stmt);
2248 tree lhs = gimple_assign_lhs (stmt);
2249 tree rhs = gimple_assign_rhs1 (stmt);
2250 bool store_p = requires_barrier (region->entry_block, lhs, NULL);
2251 bool load_p = requires_barrier (region->entry_block, rhs, NULL);
2252 gimple gcall = NULL;
2254 if (!load_p && !store_p)
2256 /* Add thread private addresses to log if applicable. */
2257 requires_barrier (region->entry_block, lhs, stmt);
2258 gsi_next (gsi);
2259 return;
2262 // Remove original load/store statement.
2263 gsi_remove (gsi, true);
2265 if (load_p && !store_p)
2267 transaction_subcode_ior (region, GTMA_HAVE_LOAD);
2268 gcall = build_tm_load (loc, lhs, rhs, gsi);
2270 else if (store_p && !load_p)
2272 transaction_subcode_ior (region, GTMA_HAVE_STORE);
2273 gcall = build_tm_store (loc, lhs, rhs, gsi);
2275 if (!gcall)
2277 tree lhs_addr, rhs_addr, tmp;
2279 if (load_p)
2280 transaction_subcode_ior (region, GTMA_HAVE_LOAD);
2281 if (store_p)
2282 transaction_subcode_ior (region, GTMA_HAVE_STORE);
2284 /* ??? Figure out if there's any possible overlap between the LHS
2285 and the RHS and if not, use MEMCPY. */
2287 if (load_p && is_gimple_reg (lhs))
2289 tmp = create_tmp_var (TREE_TYPE (lhs), NULL);
2290 lhs_addr = build_fold_addr_expr (tmp);
2292 else
2294 tmp = NULL_TREE;
2295 lhs_addr = gimplify_addr (gsi, lhs);
2297 rhs_addr = gimplify_addr (gsi, rhs);
2298 gcall = gimple_build_call (builtin_decl_explicit (BUILT_IN_TM_MEMMOVE),
2299 3, lhs_addr, rhs_addr,
2300 TYPE_SIZE_UNIT (TREE_TYPE (lhs)));
2301 gimple_set_location (gcall, loc);
2302 gsi_insert_before (gsi, gcall, GSI_SAME_STMT);
2304 if (tmp)
2306 gcall = gimple_build_assign (lhs, tmp);
2307 gsi_insert_before (gsi, gcall, GSI_SAME_STMT);
2311 /* Now that we have the load/store in its instrumented form, add
2312 thread private addresses to the log if applicable. */
2313 if (!store_p)
2314 requires_barrier (region->entry_block, lhs, gcall);
2316 // The calls to build_tm_{store,load} above inserted the instrumented
2317 // call into the stream.
2318 // gsi_insert_before (gsi, gcall, GSI_SAME_STMT);
2322 /* Expand a call statement as appropriate for a transaction. That is,
2323 either verify that the call does not affect the transaction, or
2324 redirect the call to a clone that handles transactions, or change
2325 the transaction state to IRREVOCABLE. Return true if the call is
2326 one of the builtins that end a transaction. */
2328 static bool
2329 expand_call_tm (struct tm_region *region,
2330 gimple_stmt_iterator *gsi)
2332 gimple stmt = gsi_stmt (*gsi);
2333 tree lhs = gimple_call_lhs (stmt);
2334 tree fn_decl;
2335 struct cgraph_node *node;
2336 bool retval = false;
2338 fn_decl = gimple_call_fndecl (stmt);
2340 if (fn_decl == builtin_decl_explicit (BUILT_IN_TM_MEMCPY)
2341 || fn_decl == builtin_decl_explicit (BUILT_IN_TM_MEMMOVE))
2342 transaction_subcode_ior (region, GTMA_HAVE_STORE | GTMA_HAVE_LOAD);
2343 if (fn_decl == builtin_decl_explicit (BUILT_IN_TM_MEMSET))
2344 transaction_subcode_ior (region, GTMA_HAVE_STORE);
2346 if (is_tm_pure_call (stmt))
2347 return false;
2349 if (fn_decl)
2350 retval = is_tm_ending_fndecl (fn_decl);
2351 if (!retval)
2353 /* Assume all non-const/pure calls write to memory, except
2354 transaction ending builtins. */
2355 transaction_subcode_ior (region, GTMA_HAVE_STORE);
2358 /* For indirect calls, we already generated a call into the runtime. */
2359 if (!fn_decl)
2361 tree fn = gimple_call_fn (stmt);
2363 /* We are guaranteed never to go irrevocable on a safe or pure
2364 call, and the pure call was handled above. */
2365 if (is_tm_safe (fn))
2366 return false;
2367 else
2368 transaction_subcode_ior (region, GTMA_MAY_ENTER_IRREVOCABLE);
2370 return false;
2373 node = cgraph_get_node (fn_decl);
2374 /* All calls should have cgraph here. */
2375 if (!node)
2377 /* We can have a nodeless call here if some pass after IPA-tm
2378 added uninstrumented calls. For example, loop distribution
2379 can transform certain loop constructs into __builtin_mem*
2380 calls. In this case, see if we have a suitable TM
2381 replacement and fill in the gaps. */
2382 gcc_assert (DECL_BUILT_IN_CLASS (fn_decl) == BUILT_IN_NORMAL);
2383 enum built_in_function code = DECL_FUNCTION_CODE (fn_decl);
2384 gcc_assert (code == BUILT_IN_MEMCPY
2385 || code == BUILT_IN_MEMMOVE
2386 || code == BUILT_IN_MEMSET);
2388 tree repl = find_tm_replacement_function (fn_decl);
2389 if (repl)
2391 gimple_call_set_fndecl (stmt, repl);
2392 update_stmt (stmt);
2393 node = cgraph_create_node (repl);
2394 node->local.tm_may_enter_irr = false;
2395 return expand_call_tm (region, gsi);
2397 gcc_unreachable ();
2399 if (node->local.tm_may_enter_irr)
2400 transaction_subcode_ior (region, GTMA_MAY_ENTER_IRREVOCABLE);
2402 if (is_tm_abort (fn_decl))
2404 transaction_subcode_ior (region, GTMA_HAVE_ABORT);
2405 return true;
2408 /* Instrument the store if needed.
2410 If the assignment happens inside the function call (return slot
2411 optimization), there is no instrumentation to be done, since
2412 the callee should have done the right thing. */
2413 if (lhs && requires_barrier (region->entry_block, lhs, stmt)
2414 && !gimple_call_return_slot_opt_p (stmt))
2416 tree tmp = create_tmp_reg (TREE_TYPE (lhs), NULL);
2417 location_t loc = gimple_location (stmt);
2418 edge fallthru_edge = NULL;
2420 /* Remember if the call was going to throw. */
2421 if (stmt_can_throw_internal (stmt))
2423 edge_iterator ei;
2424 edge e;
2425 basic_block bb = gimple_bb (stmt);
2427 FOR_EACH_EDGE (e, ei, bb->succs)
2428 if (e->flags & EDGE_FALLTHRU)
2430 fallthru_edge = e;
2431 break;
2435 gimple_call_set_lhs (stmt, tmp);
2436 update_stmt (stmt);
2437 stmt = gimple_build_assign (lhs, tmp);
2438 gimple_set_location (stmt, loc);
2440 /* We cannot throw in the middle of a BB. If the call was going
2441 to throw, place the instrumentation on the fallthru edge, so
2442 the call remains the last statement in the block. */
2443 if (fallthru_edge)
2445 gimple_seq fallthru_seq = gimple_seq_alloc_with_stmt (stmt);
2446 gimple_stmt_iterator fallthru_gsi = gsi_start (fallthru_seq);
2447 expand_assign_tm (region, &fallthru_gsi);
2448 gsi_insert_seq_on_edge (fallthru_edge, fallthru_seq);
2449 pending_edge_inserts_p = true;
2451 else
2453 gsi_insert_after (gsi, stmt, GSI_CONTINUE_LINKING);
2454 expand_assign_tm (region, gsi);
2457 transaction_subcode_ior (region, GTMA_HAVE_STORE);
2460 return retval;
2464 /* Expand all statements in BB as appropriate for being inside
2465 a transaction. */
2467 static void
2468 expand_block_tm (struct tm_region *region, basic_block bb)
2470 gimple_stmt_iterator gsi;
2472 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); )
2474 gimple stmt = gsi_stmt (gsi);
2475 switch (gimple_code (stmt))
2477 case GIMPLE_ASSIGN:
2478 /* Only memory reads/writes need to be instrumented. */
2479 if (gimple_assign_single_p (stmt)
2480 && !gimple_clobber_p (stmt))
2482 expand_assign_tm (region, &gsi);
2483 continue;
2485 break;
2487 case GIMPLE_CALL:
2488 if (expand_call_tm (region, &gsi))
2489 return;
2490 break;
2492 case GIMPLE_ASM:
2493 gcc_unreachable ();
2495 default:
2496 break;
2498 if (!gsi_end_p (gsi))
2499 gsi_next (&gsi);
2503 /* Return the list of basic-blocks in REGION.
2505 STOP_AT_IRREVOCABLE_P is true if caller is uninterested in blocks
2506 following a TM_IRREVOCABLE call.
2508 INCLUDE_UNINSTRUMENTED_P is TRUE if we should include the
2509 uninstrumented code path blocks in the list of basic blocks
2510 returned, false otherwise. */
2512 static vec<basic_block>
2513 get_tm_region_blocks (basic_block entry_block,
2514 bitmap exit_blocks,
2515 bitmap irr_blocks,
2516 bitmap all_region_blocks,
2517 bool stop_at_irrevocable_p,
2518 bool include_uninstrumented_p = true)
2520 vec<basic_block> bbs = vNULL;
2521 unsigned i;
2522 edge e;
2523 edge_iterator ei;
2524 bitmap visited_blocks = BITMAP_ALLOC (NULL);
2526 i = 0;
2527 bbs.safe_push (entry_block);
2528 bitmap_set_bit (visited_blocks, entry_block->index);
2532 basic_block bb = bbs[i++];
2534 if (exit_blocks &&
2535 bitmap_bit_p (exit_blocks, bb->index))
2536 continue;
2538 if (stop_at_irrevocable_p
2539 && irr_blocks
2540 && bitmap_bit_p (irr_blocks, bb->index))
2541 continue;
2543 FOR_EACH_EDGE (e, ei, bb->succs)
2544 if ((include_uninstrumented_p
2545 || !(e->flags & EDGE_TM_UNINSTRUMENTED))
2546 && !bitmap_bit_p (visited_blocks, e->dest->index))
2548 bitmap_set_bit (visited_blocks, e->dest->index);
2549 bbs.safe_push (e->dest);
2552 while (i < bbs.length ());
2554 if (all_region_blocks)
2555 bitmap_ior_into (all_region_blocks, visited_blocks);
2557 BITMAP_FREE (visited_blocks);
2558 return bbs;
2561 // Callback data for collect_bb2reg.
2562 struct bb2reg_stuff
2564 vec<tm_region_p> *bb2reg;
2565 bool include_uninstrumented_p;
2568 // Callback for expand_regions, collect innermost region data for each bb.
2569 static void *
2570 collect_bb2reg (struct tm_region *region, void *data)
2572 struct bb2reg_stuff *stuff = (struct bb2reg_stuff *)data;
2573 vec<tm_region_p> *bb2reg = stuff->bb2reg;
2574 vec<basic_block> queue;
2575 unsigned int i;
2576 basic_block bb;
2578 queue = get_tm_region_blocks (region->entry_block,
2579 region->exit_blocks,
2580 region->irr_blocks,
2581 NULL,
2582 /*stop_at_irr_p=*/true,
2583 stuff->include_uninstrumented_p);
2585 // We expect expand_region to perform a post-order traversal of the region
2586 // tree. Therefore the last region seen for any bb is the innermost.
2587 FOR_EACH_VEC_ELT (queue, i, bb)
2588 (*bb2reg)[bb->index] = region;
2590 queue.release ();
2591 return NULL;
2594 // Returns a vector, indexed by BB->INDEX, of the innermost tm_region to
2595 // which a basic block belongs. Note that we only consider the instrumented
2596 // code paths for the region; the uninstrumented code paths are ignored if
2597 // INCLUDE_UNINSTRUMENTED_P is false.
2599 // ??? This data is very similar to the bb_regions array that is collected
2600 // during tm_region_init. Or, rather, this data is similar to what could
2601 // be used within tm_region_init. The actual computation in tm_region_init
2602 // begins and ends with bb_regions entirely full of NULL pointers, due to
2603 // the way in which pointers are swapped in and out of the array.
2605 // ??? Our callers expect that blocks are not shared between transactions.
2606 // When the optimizers get too smart, and blocks are shared, then during
2607 // the tm_mark phase we'll add log entries to only one of the two transactions,
2608 // and in the tm_edge phase we'll add edges to the CFG that create invalid
2609 // cycles. The symptom being SSA defs that do not dominate their uses.
2610 // Note that the optimizers were locally correct with their transformation,
2611 // as we have no info within the program that suggests that the blocks cannot
2612 // be shared.
2614 // ??? There is currently a hack inside tree-ssa-pre.c to work around the
2615 // only known instance of this block sharing.
2617 static vec<tm_region_p>
2618 get_bb_regions_instrumented (bool traverse_clones,
2619 bool include_uninstrumented_p)
2621 unsigned n = last_basic_block_for_fn (cfun);
2622 struct bb2reg_stuff stuff;
2623 vec<tm_region_p> ret;
2625 ret.create (n);
2626 ret.safe_grow_cleared (n);
2627 stuff.bb2reg = &ret;
2628 stuff.include_uninstrumented_p = include_uninstrumented_p;
2629 expand_regions (all_tm_regions, collect_bb2reg, &stuff, traverse_clones);
2631 return ret;
2634 /* Set the IN_TRANSACTION for all gimple statements that appear in a
2635 transaction. */
2637 void
2638 compute_transaction_bits (void)
2640 struct tm_region *region;
2641 vec<basic_block> queue;
2642 unsigned int i;
2643 basic_block bb;
2645 /* ?? Perhaps we need to abstract gate_tm_init further, because we
2646 certainly don't need it to calculate CDI_DOMINATOR info. */
2647 gate_tm_init ();
2649 FOR_EACH_BB_FN (bb, cfun)
2650 bb->flags &= ~BB_IN_TRANSACTION;
2652 for (region = all_tm_regions; region; region = region->next)
2654 queue = get_tm_region_blocks (region->entry_block,
2655 region->exit_blocks,
2656 region->irr_blocks,
2657 NULL,
2658 /*stop_at_irr_p=*/true);
2659 for (i = 0; queue.iterate (i, &bb); ++i)
2660 bb->flags |= BB_IN_TRANSACTION;
2661 queue.release ();
2664 if (all_tm_regions)
2665 bitmap_obstack_release (&tm_obstack);
2668 /* Replace the GIMPLE_TRANSACTION in this region with the corresponding
2669 call to BUILT_IN_TM_START. */
2671 static void *
2672 expand_transaction (struct tm_region *region, void *data ATTRIBUTE_UNUSED)
2674 tree tm_start = builtin_decl_explicit (BUILT_IN_TM_START);
2675 basic_block transaction_bb = gimple_bb (region->transaction_stmt);
2676 tree tm_state = region->tm_state;
2677 tree tm_state_type = TREE_TYPE (tm_state);
2678 edge abort_edge = NULL;
2679 edge inst_edge = NULL;
2680 edge uninst_edge = NULL;
2681 edge fallthru_edge = NULL;
2683 // Identify the various successors of the transaction start.
2685 edge_iterator i;
2686 edge e;
2687 FOR_EACH_EDGE (e, i, transaction_bb->succs)
2689 if (e->flags & EDGE_TM_ABORT)
2690 abort_edge = e;
2691 else if (e->flags & EDGE_TM_UNINSTRUMENTED)
2692 uninst_edge = e;
2693 else
2694 inst_edge = e;
2695 if (e->flags & EDGE_FALLTHRU)
2696 fallthru_edge = e;
2700 /* ??? There are plenty of bits here we're not computing. */
2702 int subcode = gimple_transaction_subcode (region->transaction_stmt);
2703 int flags = 0;
2704 if (subcode & GTMA_DOES_GO_IRREVOCABLE)
2705 flags |= PR_DOESGOIRREVOCABLE;
2706 if ((subcode & GTMA_MAY_ENTER_IRREVOCABLE) == 0)
2707 flags |= PR_HASNOIRREVOCABLE;
2708 /* If the transaction does not have an abort in lexical scope and is not
2709 marked as an outer transaction, then it will never abort. */
2710 if ((subcode & GTMA_HAVE_ABORT) == 0 && (subcode & GTMA_IS_OUTER) == 0)
2711 flags |= PR_HASNOABORT;
2712 if ((subcode & GTMA_HAVE_STORE) == 0)
2713 flags |= PR_READONLY;
2714 if (inst_edge && !(subcode & GTMA_HAS_NO_INSTRUMENTATION))
2715 flags |= PR_INSTRUMENTEDCODE;
2716 if (uninst_edge)
2717 flags |= PR_UNINSTRUMENTEDCODE;
2718 if (subcode & GTMA_IS_OUTER)
2719 region->original_transaction_was_outer = true;
2720 tree t = build_int_cst (tm_state_type, flags);
2721 gimple call = gimple_build_call (tm_start, 1, t);
2722 gimple_call_set_lhs (call, tm_state);
2723 gimple_set_location (call, gimple_location (region->transaction_stmt));
2725 // Replace the GIMPLE_TRANSACTION with the call to BUILT_IN_TM_START.
2726 gimple_stmt_iterator gsi = gsi_last_bb (transaction_bb);
2727 gcc_assert (gsi_stmt (gsi) == region->transaction_stmt);
2728 gsi_insert_before (&gsi, call, GSI_SAME_STMT);
2729 gsi_remove (&gsi, true);
2730 region->transaction_stmt = call;
2733 // Generate log saves.
2734 if (!tm_log_save_addresses.is_empty ())
2735 tm_log_emit_saves (region->entry_block, transaction_bb);
2737 // In the beginning, we've no tests to perform on transaction restart.
2738 // Note that after this point, transaction_bb becomes the "most recent
2739 // block containing tests for the transaction".
2740 region->restart_block = region->entry_block;
2742 // Generate log restores.
2743 if (!tm_log_save_addresses.is_empty ())
2745 basic_block test_bb = create_empty_bb (transaction_bb);
2746 basic_block code_bb = create_empty_bb (test_bb);
2747 basic_block join_bb = create_empty_bb (code_bb);
2748 add_bb_to_loop (test_bb, transaction_bb->loop_father);
2749 add_bb_to_loop (code_bb, transaction_bb->loop_father);
2750 add_bb_to_loop (join_bb, transaction_bb->loop_father);
2751 if (region->restart_block == region->entry_block)
2752 region->restart_block = test_bb;
2754 tree t1 = create_tmp_reg (tm_state_type, NULL);
2755 tree t2 = build_int_cst (tm_state_type, A_RESTORELIVEVARIABLES);
2756 gimple stmt = gimple_build_assign_with_ops (BIT_AND_EXPR, t1,
2757 tm_state, t2);
2758 gimple_stmt_iterator gsi = gsi_last_bb (test_bb);
2759 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
2761 t2 = build_int_cst (tm_state_type, 0);
2762 stmt = gimple_build_cond (NE_EXPR, t1, t2, NULL, NULL);
2763 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
2765 tm_log_emit_restores (region->entry_block, code_bb);
2767 edge ei = make_edge (transaction_bb, test_bb, EDGE_FALLTHRU);
2768 edge et = make_edge (test_bb, code_bb, EDGE_TRUE_VALUE);
2769 edge ef = make_edge (test_bb, join_bb, EDGE_FALSE_VALUE);
2770 redirect_edge_pred (fallthru_edge, join_bb);
2772 join_bb->frequency = test_bb->frequency = transaction_bb->frequency;
2773 join_bb->count = test_bb->count = transaction_bb->count;
2775 ei->probability = PROB_ALWAYS;
2776 et->probability = PROB_LIKELY;
2777 ef->probability = PROB_UNLIKELY;
2778 et->count = apply_probability (test_bb->count, et->probability);
2779 ef->count = apply_probability (test_bb->count, ef->probability);
2781 code_bb->count = et->count;
2782 code_bb->frequency = EDGE_FREQUENCY (et);
2784 transaction_bb = join_bb;
2787 // If we have an ABORT edge, create a test to perform the abort.
2788 if (abort_edge)
2790 basic_block test_bb = create_empty_bb (transaction_bb);
2791 add_bb_to_loop (test_bb, transaction_bb->loop_father);
2792 if (region->restart_block == region->entry_block)
2793 region->restart_block = test_bb;
2795 tree t1 = create_tmp_reg (tm_state_type, NULL);
2796 tree t2 = build_int_cst (tm_state_type, A_ABORTTRANSACTION);
2797 gimple stmt = gimple_build_assign_with_ops (BIT_AND_EXPR, t1,
2798 tm_state, t2);
2799 gimple_stmt_iterator gsi = gsi_last_bb (test_bb);
2800 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
2802 t2 = build_int_cst (tm_state_type, 0);
2803 stmt = gimple_build_cond (NE_EXPR, t1, t2, NULL, NULL);
2804 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
2806 edge ei = make_edge (transaction_bb, test_bb, EDGE_FALLTHRU);
2807 test_bb->frequency = transaction_bb->frequency;
2808 test_bb->count = transaction_bb->count;
2809 ei->probability = PROB_ALWAYS;
2811 // Not abort edge. If both are live, chose one at random as we'll
2812 // we'll be fixing that up below.
2813 redirect_edge_pred (fallthru_edge, test_bb);
2814 fallthru_edge->flags = EDGE_FALSE_VALUE;
2815 fallthru_edge->probability = PROB_VERY_LIKELY;
2816 fallthru_edge->count
2817 = apply_probability (test_bb->count, fallthru_edge->probability);
2819 // Abort/over edge.
2820 redirect_edge_pred (abort_edge, test_bb);
2821 abort_edge->flags = EDGE_TRUE_VALUE;
2822 abort_edge->probability = PROB_VERY_UNLIKELY;
2823 abort_edge->count
2824 = apply_probability (test_bb->count, abort_edge->probability);
2826 transaction_bb = test_bb;
2829 // If we have both instrumented and uninstrumented code paths, select one.
2830 if (inst_edge && uninst_edge)
2832 basic_block test_bb = create_empty_bb (transaction_bb);
2833 add_bb_to_loop (test_bb, transaction_bb->loop_father);
2834 if (region->restart_block == region->entry_block)
2835 region->restart_block = test_bb;
2837 tree t1 = create_tmp_reg (tm_state_type, NULL);
2838 tree t2 = build_int_cst (tm_state_type, A_RUNUNINSTRUMENTEDCODE);
2840 gimple stmt = gimple_build_assign_with_ops (BIT_AND_EXPR, t1,
2841 tm_state, t2);
2842 gimple_stmt_iterator gsi = gsi_last_bb (test_bb);
2843 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
2845 t2 = build_int_cst (tm_state_type, 0);
2846 stmt = gimple_build_cond (NE_EXPR, t1, t2, NULL, NULL);
2847 gsi_insert_after (&gsi, stmt, GSI_CONTINUE_LINKING);
2849 // Create the edge into test_bb first, as we want to copy values
2850 // out of the fallthru edge.
2851 edge e = make_edge (transaction_bb, test_bb, fallthru_edge->flags);
2852 e->probability = fallthru_edge->probability;
2853 test_bb->count = e->count = fallthru_edge->count;
2854 test_bb->frequency = EDGE_FREQUENCY (e);
2856 // Now update the edges to the inst/uninist implementations.
2857 // For now assume that the paths are equally likely. When using HTM,
2858 // we'll try the uninst path first and fallback to inst path if htm
2859 // buffers are exceeded. Without HTM we start with the inst path and
2860 // use the uninst path when falling back to serial mode.
2861 redirect_edge_pred (inst_edge, test_bb);
2862 inst_edge->flags = EDGE_FALSE_VALUE;
2863 inst_edge->probability = REG_BR_PROB_BASE / 2;
2864 inst_edge->count
2865 = apply_probability (test_bb->count, inst_edge->probability);
2867 redirect_edge_pred (uninst_edge, test_bb);
2868 uninst_edge->flags = EDGE_TRUE_VALUE;
2869 uninst_edge->probability = REG_BR_PROB_BASE / 2;
2870 uninst_edge->count
2871 = apply_probability (test_bb->count, uninst_edge->probability);
2874 // If we have no previous special cases, and we have PHIs at the beginning
2875 // of the atomic region, this means we have a loop at the beginning of the
2876 // atomic region that shares the first block. This can cause problems with
2877 // the transaction restart abnormal edges to be added in the tm_edges pass.
2878 // Solve this by adding a new empty block to receive the abnormal edges.
2879 if (region->restart_block == region->entry_block
2880 && phi_nodes (region->entry_block))
2882 basic_block empty_bb = create_empty_bb (transaction_bb);
2883 region->restart_block = empty_bb;
2884 add_bb_to_loop (empty_bb, transaction_bb->loop_father);
2886 redirect_edge_pred (fallthru_edge, empty_bb);
2887 make_edge (transaction_bb, empty_bb, EDGE_FALLTHRU);
2890 return NULL;
2893 /* Generate the temporary to be used for the return value of
2894 BUILT_IN_TM_START. */
2896 static void *
2897 generate_tm_state (struct tm_region *region, void *data ATTRIBUTE_UNUSED)
2899 tree tm_start = builtin_decl_explicit (BUILT_IN_TM_START);
2900 region->tm_state =
2901 create_tmp_reg (TREE_TYPE (TREE_TYPE (tm_start)), "tm_state");
2903 // Reset the subcode, post optimizations. We'll fill this in
2904 // again as we process blocks.
2905 if (region->exit_blocks)
2907 unsigned int subcode
2908 = gimple_transaction_subcode (region->transaction_stmt);
2910 if (subcode & GTMA_DOES_GO_IRREVOCABLE)
2911 subcode &= (GTMA_DECLARATION_MASK | GTMA_DOES_GO_IRREVOCABLE
2912 | GTMA_MAY_ENTER_IRREVOCABLE
2913 | GTMA_HAS_NO_INSTRUMENTATION);
2914 else
2915 subcode &= GTMA_DECLARATION_MASK;
2916 gimple_transaction_set_subcode (region->transaction_stmt, subcode);
2919 return NULL;
2922 // Propagate flags from inner transactions outwards.
2923 static void
2924 propagate_tm_flags_out (struct tm_region *region)
2926 if (region == NULL)
2927 return;
2928 propagate_tm_flags_out (region->inner);
2930 if (region->outer && region->outer->transaction_stmt)
2932 unsigned s = gimple_transaction_subcode (region->transaction_stmt);
2933 s &= (GTMA_HAVE_ABORT | GTMA_HAVE_LOAD | GTMA_HAVE_STORE
2934 | GTMA_MAY_ENTER_IRREVOCABLE);
2935 s |= gimple_transaction_subcode (region->outer->transaction_stmt);
2936 gimple_transaction_set_subcode (region->outer->transaction_stmt, s);
2939 propagate_tm_flags_out (region->next);
2942 /* Entry point to the MARK phase of TM expansion. Here we replace
2943 transactional memory statements with calls to builtins, and function
2944 calls with their transactional clones (if available). But we don't
2945 yet lower GIMPLE_TRANSACTION or add the transaction restart back-edges. */
2947 static unsigned int
2948 execute_tm_mark (void)
2950 pending_edge_inserts_p = false;
2952 expand_regions (all_tm_regions, generate_tm_state, NULL,
2953 /*traverse_clones=*/true);
2955 tm_log_init ();
2957 vec<tm_region_p> bb_regions
2958 = get_bb_regions_instrumented (/*traverse_clones=*/true,
2959 /*include_uninstrumented_p=*/false);
2960 struct tm_region *r;
2961 unsigned i;
2963 // Expand memory operations into calls into the runtime.
2964 // This collects log entries as well.
2965 FOR_EACH_VEC_ELT (bb_regions, i, r)
2967 if (r != NULL)
2969 if (r->transaction_stmt)
2971 unsigned sub = gimple_transaction_subcode (r->transaction_stmt);
2973 /* If we're sure to go irrevocable, there won't be
2974 anything to expand, since the run-time will go
2975 irrevocable right away. */
2976 if (sub & GTMA_DOES_GO_IRREVOCABLE
2977 && sub & GTMA_MAY_ENTER_IRREVOCABLE)
2978 continue;
2980 expand_block_tm (r, BASIC_BLOCK_FOR_FN (cfun, i));
2984 bb_regions.release ();
2986 // Propagate flags from inner transactions outwards.
2987 propagate_tm_flags_out (all_tm_regions);
2989 // Expand GIMPLE_TRANSACTIONs into calls into the runtime.
2990 expand_regions (all_tm_regions, expand_transaction, NULL,
2991 /*traverse_clones=*/false);
2993 tm_log_emit ();
2994 tm_log_delete ();
2996 if (pending_edge_inserts_p)
2997 gsi_commit_edge_inserts ();
2998 free_dominance_info (CDI_DOMINATORS);
2999 return 0;
3002 namespace {
3004 const pass_data pass_data_tm_mark =
3006 GIMPLE_PASS, /* type */
3007 "tmmark", /* name */
3008 OPTGROUP_NONE, /* optinfo_flags */
3009 true, /* has_execute */
3010 TV_TRANS_MEM, /* tv_id */
3011 ( PROP_ssa | PROP_cfg ), /* properties_required */
3012 0, /* properties_provided */
3013 0, /* properties_destroyed */
3014 0, /* todo_flags_start */
3015 TODO_update_ssa, /* todo_flags_finish */
3018 class pass_tm_mark : public gimple_opt_pass
3020 public:
3021 pass_tm_mark (gcc::context *ctxt)
3022 : gimple_opt_pass (pass_data_tm_mark, ctxt)
3025 /* opt_pass methods: */
3026 virtual unsigned int execute (function *) { return execute_tm_mark (); }
3028 }; // class pass_tm_mark
3030 } // anon namespace
3032 gimple_opt_pass *
3033 make_pass_tm_mark (gcc::context *ctxt)
3035 return new pass_tm_mark (ctxt);
3039 /* Create an abnormal edge from STMT at iter, splitting the block
3040 as necessary. Adjust *PNEXT as needed for the split block. */
3042 static inline void
3043 split_bb_make_tm_edge (gimple stmt, basic_block dest_bb,
3044 gimple_stmt_iterator iter, gimple_stmt_iterator *pnext)
3046 basic_block bb = gimple_bb (stmt);
3047 if (!gsi_one_before_end_p (iter))
3049 edge e = split_block (bb, stmt);
3050 *pnext = gsi_start_bb (e->dest);
3052 make_edge (bb, dest_bb, EDGE_ABNORMAL);
3054 // Record the need for the edge for the benefit of the rtl passes.
3055 if (cfun->gimple_df->tm_restart == NULL)
3056 cfun->gimple_df->tm_restart = htab_create_ggc (31, struct_ptr_hash,
3057 struct_ptr_eq, ggc_free);
3059 struct tm_restart_node dummy;
3060 dummy.stmt = stmt;
3061 dummy.label_or_list = gimple_block_label (dest_bb);
3063 void **slot = htab_find_slot (cfun->gimple_df->tm_restart, &dummy, INSERT);
3064 struct tm_restart_node *n = (struct tm_restart_node *) *slot;
3065 if (n == NULL)
3067 n = ggc_alloc<tm_restart_node> ();
3068 *n = dummy;
3070 else
3072 tree old = n->label_or_list;
3073 if (TREE_CODE (old) == LABEL_DECL)
3074 old = tree_cons (NULL, old, NULL);
3075 n->label_or_list = tree_cons (NULL, dummy.label_or_list, old);
3079 /* Split block BB as necessary for every builtin function we added, and
3080 wire up the abnormal back edges implied by the transaction restart. */
3082 static void
3083 expand_block_edges (struct tm_region *const region, basic_block bb)
3085 gimple_stmt_iterator gsi, next_gsi;
3087 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi = next_gsi)
3089 gimple stmt = gsi_stmt (gsi);
3091 next_gsi = gsi;
3092 gsi_next (&next_gsi);
3094 // ??? Shouldn't we split for any non-pure, non-irrevocable function?
3095 if (gimple_code (stmt) != GIMPLE_CALL
3096 || (gimple_call_flags (stmt) & ECF_TM_BUILTIN) == 0)
3097 continue;
3099 if (DECL_FUNCTION_CODE (gimple_call_fndecl (stmt)) == BUILT_IN_TM_ABORT)
3101 // If we have a ``_transaction_cancel [[outer]]'', there is only
3102 // one abnormal edge: to the transaction marked OUTER.
3103 // All compiler-generated instances of BUILT_IN_TM_ABORT have a
3104 // constant argument, which we can examine here. Users invoking
3105 // TM_ABORT directly get what they deserve.
3106 tree arg = gimple_call_arg (stmt, 0);
3107 if (TREE_CODE (arg) == INTEGER_CST
3108 && (TREE_INT_CST_LOW (arg) & AR_OUTERABORT) != 0
3109 && !decl_is_tm_clone (current_function_decl))
3111 // Find the GTMA_IS_OUTER transaction.
3112 for (struct tm_region *o = region; o; o = o->outer)
3113 if (o->original_transaction_was_outer)
3115 split_bb_make_tm_edge (stmt, o->restart_block,
3116 gsi, &next_gsi);
3117 break;
3120 // Otherwise, the front-end should have semantically checked
3121 // outer aborts, but in either case the target region is not
3122 // within this function.
3123 continue;
3126 // Non-outer, TM aborts have an abnormal edge to the inner-most
3127 // transaction, the one being aborted;
3128 split_bb_make_tm_edge (stmt, region->restart_block, gsi, &next_gsi);
3131 // All TM builtins have an abnormal edge to the outer-most transaction.
3132 // We never restart inner transactions. For tm clones, we know a-priori
3133 // that the outer-most transaction is outside the function.
3134 if (decl_is_tm_clone (current_function_decl))
3135 continue;
3137 if (cfun->gimple_df->tm_restart == NULL)
3138 cfun->gimple_df->tm_restart
3139 = htab_create_ggc (31, struct_ptr_hash, struct_ptr_eq, ggc_free);
3141 // All TM builtins have an abnormal edge to the outer-most transaction.
3142 // We never restart inner transactions.
3143 for (struct tm_region *o = region; o; o = o->outer)
3144 if (!o->outer)
3146 split_bb_make_tm_edge (stmt, o->restart_block, gsi, &next_gsi);
3147 break;
3150 // Delete any tail-call annotation that may have been added.
3151 // The tail-call pass may have mis-identified the commit as being
3152 // a candidate because we had not yet added this restart edge.
3153 gimple_call_set_tail (stmt, false);
3157 /* Entry point to the final expansion of transactional nodes. */
3159 namespace {
3161 const pass_data pass_data_tm_edges =
3163 GIMPLE_PASS, /* type */
3164 "tmedge", /* name */
3165 OPTGROUP_NONE, /* optinfo_flags */
3166 true, /* has_execute */
3167 TV_TRANS_MEM, /* tv_id */
3168 ( PROP_ssa | PROP_cfg ), /* properties_required */
3169 0, /* properties_provided */
3170 0, /* properties_destroyed */
3171 0, /* todo_flags_start */
3172 TODO_update_ssa, /* todo_flags_finish */
3175 class pass_tm_edges : public gimple_opt_pass
3177 public:
3178 pass_tm_edges (gcc::context *ctxt)
3179 : gimple_opt_pass (pass_data_tm_edges, ctxt)
3182 /* opt_pass methods: */
3183 virtual unsigned int execute (function *);
3185 }; // class pass_tm_edges
3187 unsigned int
3188 pass_tm_edges::execute (function *fun)
3190 vec<tm_region_p> bb_regions
3191 = get_bb_regions_instrumented (/*traverse_clones=*/false,
3192 /*include_uninstrumented_p=*/true);
3193 struct tm_region *r;
3194 unsigned i;
3196 FOR_EACH_VEC_ELT (bb_regions, i, r)
3197 if (r != NULL)
3198 expand_block_edges (r, BASIC_BLOCK_FOR_FN (fun, i));
3200 bb_regions.release ();
3202 /* We've got to release the dominance info now, to indicate that it
3203 must be rebuilt completely. Otherwise we'll crash trying to update
3204 the SSA web in the TODO section following this pass. */
3205 free_dominance_info (CDI_DOMINATORS);
3206 bitmap_obstack_release (&tm_obstack);
3207 all_tm_regions = NULL;
3209 return 0;
3212 } // anon namespace
3214 gimple_opt_pass *
3215 make_pass_tm_edges (gcc::context *ctxt)
3217 return new pass_tm_edges (ctxt);
3220 /* Helper function for expand_regions. Expand REGION and recurse to
3221 the inner region. Call CALLBACK on each region. CALLBACK returns
3222 NULL to continue the traversal, otherwise a non-null value which
3223 this function will return as well. TRAVERSE_CLONES is true if we
3224 should traverse transactional clones. */
3226 static void *
3227 expand_regions_1 (struct tm_region *region,
3228 void *(*callback)(struct tm_region *, void *),
3229 void *data,
3230 bool traverse_clones)
3232 void *retval = NULL;
3233 if (region->exit_blocks
3234 || (traverse_clones && decl_is_tm_clone (current_function_decl)))
3236 retval = callback (region, data);
3237 if (retval)
3238 return retval;
3240 if (region->inner)
3242 retval = expand_regions (region->inner, callback, data, traverse_clones);
3243 if (retval)
3244 return retval;
3246 return retval;
3249 /* Traverse the regions enclosed and including REGION. Execute
3250 CALLBACK for each region, passing DATA. CALLBACK returns NULL to
3251 continue the traversal, otherwise a non-null value which this
3252 function will return as well. TRAVERSE_CLONES is true if we should
3253 traverse transactional clones. */
3255 static void *
3256 expand_regions (struct tm_region *region,
3257 void *(*callback)(struct tm_region *, void *),
3258 void *data,
3259 bool traverse_clones)
3261 void *retval = NULL;
3262 while (region)
3264 retval = expand_regions_1 (region, callback, data, traverse_clones);
3265 if (retval)
3266 return retval;
3267 region = region->next;
3269 return retval;
3273 /* A unique TM memory operation. */
3274 typedef struct tm_memop
3276 /* Unique ID that all memory operations to the same location have. */
3277 unsigned int value_id;
3278 /* Address of load/store. */
3279 tree addr;
3280 } *tm_memop_t;
3282 /* TM memory operation hashtable helpers. */
3284 struct tm_memop_hasher : typed_free_remove <tm_memop>
3286 typedef tm_memop value_type;
3287 typedef tm_memop compare_type;
3288 static inline hashval_t hash (const value_type *);
3289 static inline bool equal (const value_type *, const compare_type *);
3292 /* Htab support. Return a hash value for a `tm_memop'. */
3293 inline hashval_t
3294 tm_memop_hasher::hash (const value_type *mem)
3296 tree addr = mem->addr;
3297 /* We drill down to the SSA_NAME/DECL for the hash, but equality is
3298 actually done with operand_equal_p (see tm_memop_eq). */
3299 if (TREE_CODE (addr) == ADDR_EXPR)
3300 addr = TREE_OPERAND (addr, 0);
3301 return iterative_hash_expr (addr, 0);
3304 /* Htab support. Return true if two tm_memop's are the same. */
3305 inline bool
3306 tm_memop_hasher::equal (const value_type *mem1, const compare_type *mem2)
3308 return operand_equal_p (mem1->addr, mem2->addr, 0);
3311 /* Sets for solving data flow equations in the memory optimization pass. */
3312 struct tm_memopt_bitmaps
3314 /* Stores available to this BB upon entry. Basically, stores that
3315 dominate this BB. */
3316 bitmap store_avail_in;
3317 /* Stores available at the end of this BB. */
3318 bitmap store_avail_out;
3319 bitmap store_antic_in;
3320 bitmap store_antic_out;
3321 /* Reads available to this BB upon entry. Basically, reads that
3322 dominate this BB. */
3323 bitmap read_avail_in;
3324 /* Reads available at the end of this BB. */
3325 bitmap read_avail_out;
3326 /* Reads performed in this BB. */
3327 bitmap read_local;
3328 /* Writes performed in this BB. */
3329 bitmap store_local;
3331 /* Temporary storage for pass. */
3332 /* Is the current BB in the worklist? */
3333 bool avail_in_worklist_p;
3334 /* Have we visited this BB? */
3335 bool visited_p;
3338 static bitmap_obstack tm_memopt_obstack;
3340 /* Unique counter for TM loads and stores. Loads and stores of the
3341 same address get the same ID. */
3342 static unsigned int tm_memopt_value_id;
3343 static hash_table <tm_memop_hasher> tm_memopt_value_numbers;
3345 #define STORE_AVAIL_IN(BB) \
3346 ((struct tm_memopt_bitmaps *) ((BB)->aux))->store_avail_in
3347 #define STORE_AVAIL_OUT(BB) \
3348 ((struct tm_memopt_bitmaps *) ((BB)->aux))->store_avail_out
3349 #define STORE_ANTIC_IN(BB) \
3350 ((struct tm_memopt_bitmaps *) ((BB)->aux))->store_antic_in
3351 #define STORE_ANTIC_OUT(BB) \
3352 ((struct tm_memopt_bitmaps *) ((BB)->aux))->store_antic_out
3353 #define READ_AVAIL_IN(BB) \
3354 ((struct tm_memopt_bitmaps *) ((BB)->aux))->read_avail_in
3355 #define READ_AVAIL_OUT(BB) \
3356 ((struct tm_memopt_bitmaps *) ((BB)->aux))->read_avail_out
3357 #define READ_LOCAL(BB) \
3358 ((struct tm_memopt_bitmaps *) ((BB)->aux))->read_local
3359 #define STORE_LOCAL(BB) \
3360 ((struct tm_memopt_bitmaps *) ((BB)->aux))->store_local
3361 #define AVAIL_IN_WORKLIST_P(BB) \
3362 ((struct tm_memopt_bitmaps *) ((BB)->aux))->avail_in_worklist_p
3363 #define BB_VISITED_P(BB) \
3364 ((struct tm_memopt_bitmaps *) ((BB)->aux))->visited_p
3366 /* Given a TM load/store in STMT, return the value number for the address
3367 it accesses. */
3369 static unsigned int
3370 tm_memopt_value_number (gimple stmt, enum insert_option op)
3372 struct tm_memop tmpmem, *mem;
3373 tm_memop **slot;
3375 gcc_assert (is_tm_load (stmt) || is_tm_store (stmt));
3376 tmpmem.addr = gimple_call_arg (stmt, 0);
3377 slot = tm_memopt_value_numbers.find_slot (&tmpmem, op);
3378 if (*slot)
3379 mem = *slot;
3380 else if (op == INSERT)
3382 mem = XNEW (struct tm_memop);
3383 *slot = mem;
3384 mem->value_id = tm_memopt_value_id++;
3385 mem->addr = tmpmem.addr;
3387 else
3388 gcc_unreachable ();
3389 return mem->value_id;
3392 /* Accumulate TM memory operations in BB into STORE_LOCAL and READ_LOCAL. */
3394 static void
3395 tm_memopt_accumulate_memops (basic_block bb)
3397 gimple_stmt_iterator gsi;
3399 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
3401 gimple stmt = gsi_stmt (gsi);
3402 bitmap bits;
3403 unsigned int loc;
3405 if (is_tm_store (stmt))
3406 bits = STORE_LOCAL (bb);
3407 else if (is_tm_load (stmt))
3408 bits = READ_LOCAL (bb);
3409 else
3410 continue;
3412 loc = tm_memopt_value_number (stmt, INSERT);
3413 bitmap_set_bit (bits, loc);
3414 if (dump_file)
3416 fprintf (dump_file, "TM memopt (%s): value num=%d, BB=%d, addr=",
3417 is_tm_load (stmt) ? "LOAD" : "STORE", loc,
3418 gimple_bb (stmt)->index);
3419 print_generic_expr (dump_file, gimple_call_arg (stmt, 0), 0);
3420 fprintf (dump_file, "\n");
3425 /* Prettily dump one of the memopt sets. BITS is the bitmap to dump. */
3427 static void
3428 dump_tm_memopt_set (const char *set_name, bitmap bits)
3430 unsigned i;
3431 bitmap_iterator bi;
3432 const char *comma = "";
3434 fprintf (dump_file, "TM memopt: %s: [", set_name);
3435 EXECUTE_IF_SET_IN_BITMAP (bits, 0, i, bi)
3437 hash_table <tm_memop_hasher>::iterator hi;
3438 struct tm_memop *mem = NULL;
3440 /* Yeah, yeah, yeah. Whatever. This is just for debugging. */
3441 FOR_EACH_HASH_TABLE_ELEMENT (tm_memopt_value_numbers, mem, tm_memop_t, hi)
3442 if (mem->value_id == i)
3443 break;
3444 gcc_assert (mem->value_id == i);
3445 fprintf (dump_file, "%s", comma);
3446 comma = ", ";
3447 print_generic_expr (dump_file, mem->addr, 0);
3449 fprintf (dump_file, "]\n");
3452 /* Prettily dump all of the memopt sets in BLOCKS. */
3454 static void
3455 dump_tm_memopt_sets (vec<basic_block> blocks)
3457 size_t i;
3458 basic_block bb;
3460 for (i = 0; blocks.iterate (i, &bb); ++i)
3462 fprintf (dump_file, "------------BB %d---------\n", bb->index);
3463 dump_tm_memopt_set ("STORE_LOCAL", STORE_LOCAL (bb));
3464 dump_tm_memopt_set ("READ_LOCAL", READ_LOCAL (bb));
3465 dump_tm_memopt_set ("STORE_AVAIL_IN", STORE_AVAIL_IN (bb));
3466 dump_tm_memopt_set ("STORE_AVAIL_OUT", STORE_AVAIL_OUT (bb));
3467 dump_tm_memopt_set ("READ_AVAIL_IN", READ_AVAIL_IN (bb));
3468 dump_tm_memopt_set ("READ_AVAIL_OUT", READ_AVAIL_OUT (bb));
3472 /* Compute {STORE,READ}_AVAIL_IN for the basic block BB. */
3474 static void
3475 tm_memopt_compute_avin (basic_block bb)
3477 edge e;
3478 unsigned ix;
3480 /* Seed with the AVOUT of any predecessor. */
3481 for (ix = 0; ix < EDGE_COUNT (bb->preds); ix++)
3483 e = EDGE_PRED (bb, ix);
3484 /* Make sure we have already visited this BB, and is thus
3485 initialized.
3487 If e->src->aux is NULL, this predecessor is actually on an
3488 enclosing transaction. We only care about the current
3489 transaction, so ignore it. */
3490 if (e->src->aux && BB_VISITED_P (e->src))
3492 bitmap_copy (STORE_AVAIL_IN (bb), STORE_AVAIL_OUT (e->src));
3493 bitmap_copy (READ_AVAIL_IN (bb), READ_AVAIL_OUT (e->src));
3494 break;
3498 for (; ix < EDGE_COUNT (bb->preds); ix++)
3500 e = EDGE_PRED (bb, ix);
3501 if (e->src->aux && BB_VISITED_P (e->src))
3503 bitmap_and_into (STORE_AVAIL_IN (bb), STORE_AVAIL_OUT (e->src));
3504 bitmap_and_into (READ_AVAIL_IN (bb), READ_AVAIL_OUT (e->src));
3508 BB_VISITED_P (bb) = true;
3511 /* Compute the STORE_ANTIC_IN for the basic block BB. */
3513 static void
3514 tm_memopt_compute_antin (basic_block bb)
3516 edge e;
3517 unsigned ix;
3519 /* Seed with the ANTIC_OUT of any successor. */
3520 for (ix = 0; ix < EDGE_COUNT (bb->succs); ix++)
3522 e = EDGE_SUCC (bb, ix);
3523 /* Make sure we have already visited this BB, and is thus
3524 initialized. */
3525 if (BB_VISITED_P (e->dest))
3527 bitmap_copy (STORE_ANTIC_IN (bb), STORE_ANTIC_OUT (e->dest));
3528 break;
3532 for (; ix < EDGE_COUNT (bb->succs); ix++)
3534 e = EDGE_SUCC (bb, ix);
3535 if (BB_VISITED_P (e->dest))
3536 bitmap_and_into (STORE_ANTIC_IN (bb), STORE_ANTIC_OUT (e->dest));
3539 BB_VISITED_P (bb) = true;
3542 /* Compute the AVAIL sets for every basic block in BLOCKS.
3544 We compute {STORE,READ}_AVAIL_{OUT,IN} as follows:
3546 AVAIL_OUT[bb] = union (AVAIL_IN[bb], LOCAL[bb])
3547 AVAIL_IN[bb] = intersect (AVAIL_OUT[predecessors])
3549 This is basically what we do in lcm's compute_available(), but here
3550 we calculate two sets of sets (one for STOREs and one for READs),
3551 and we work on a region instead of the entire CFG.
3553 REGION is the TM region.
3554 BLOCKS are the basic blocks in the region. */
3556 static void
3557 tm_memopt_compute_available (struct tm_region *region,
3558 vec<basic_block> blocks)
3560 edge e;
3561 basic_block *worklist, *qin, *qout, *qend, bb;
3562 unsigned int qlen, i;
3563 edge_iterator ei;
3564 bool changed;
3566 /* Allocate a worklist array/queue. Entries are only added to the
3567 list if they were not already on the list. So the size is
3568 bounded by the number of basic blocks in the region. */
3569 qlen = blocks.length () - 1;
3570 qin = qout = worklist =
3571 XNEWVEC (basic_block, qlen);
3573 /* Put every block in the region on the worklist. */
3574 for (i = 0; blocks.iterate (i, &bb); ++i)
3576 /* Seed AVAIL_OUT with the LOCAL set. */
3577 bitmap_ior_into (STORE_AVAIL_OUT (bb), STORE_LOCAL (bb));
3578 bitmap_ior_into (READ_AVAIL_OUT (bb), READ_LOCAL (bb));
3580 AVAIL_IN_WORKLIST_P (bb) = true;
3581 /* No need to insert the entry block, since it has an AVIN of
3582 null, and an AVOUT that has already been seeded in. */
3583 if (bb != region->entry_block)
3584 *qin++ = bb;
3587 /* The entry block has been initialized with the local sets. */
3588 BB_VISITED_P (region->entry_block) = true;
3590 qin = worklist;
3591 qend = &worklist[qlen];
3593 /* Iterate until the worklist is empty. */
3594 while (qlen)
3596 /* Take the first entry off the worklist. */
3597 bb = *qout++;
3598 qlen--;
3600 if (qout >= qend)
3601 qout = worklist;
3603 /* This block can be added to the worklist again if necessary. */
3604 AVAIL_IN_WORKLIST_P (bb) = false;
3605 tm_memopt_compute_avin (bb);
3607 /* Note: We do not add the LOCAL sets here because we already
3608 seeded the AVAIL_OUT sets with them. */
3609 changed = bitmap_ior_into (STORE_AVAIL_OUT (bb), STORE_AVAIL_IN (bb));
3610 changed |= bitmap_ior_into (READ_AVAIL_OUT (bb), READ_AVAIL_IN (bb));
3611 if (changed
3612 && (region->exit_blocks == NULL
3613 || !bitmap_bit_p (region->exit_blocks, bb->index)))
3614 /* If the out state of this block changed, then we need to add
3615 its successors to the worklist if they are not already in. */
3616 FOR_EACH_EDGE (e, ei, bb->succs)
3617 if (!AVAIL_IN_WORKLIST_P (e->dest)
3618 && e->dest != EXIT_BLOCK_PTR_FOR_FN (cfun))
3620 *qin++ = e->dest;
3621 AVAIL_IN_WORKLIST_P (e->dest) = true;
3622 qlen++;
3624 if (qin >= qend)
3625 qin = worklist;
3629 free (worklist);
3631 if (dump_file)
3632 dump_tm_memopt_sets (blocks);
3635 /* Compute ANTIC sets for every basic block in BLOCKS.
3637 We compute STORE_ANTIC_OUT as follows:
3639 STORE_ANTIC_OUT[bb] = union(STORE_ANTIC_IN[bb], STORE_LOCAL[bb])
3640 STORE_ANTIC_IN[bb] = intersect(STORE_ANTIC_OUT[successors])
3642 REGION is the TM region.
3643 BLOCKS are the basic blocks in the region. */
3645 static void
3646 tm_memopt_compute_antic (struct tm_region *region,
3647 vec<basic_block> blocks)
3649 edge e;
3650 basic_block *worklist, *qin, *qout, *qend, bb;
3651 unsigned int qlen;
3652 int i;
3653 edge_iterator ei;
3655 /* Allocate a worklist array/queue. Entries are only added to the
3656 list if they were not already on the list. So the size is
3657 bounded by the number of basic blocks in the region. */
3658 qin = qout = worklist = XNEWVEC (basic_block, blocks.length ());
3660 for (qlen = 0, i = blocks.length () - 1; i >= 0; --i)
3662 bb = blocks[i];
3664 /* Seed ANTIC_OUT with the LOCAL set. */
3665 bitmap_ior_into (STORE_ANTIC_OUT (bb), STORE_LOCAL (bb));
3667 /* Put every block in the region on the worklist. */
3668 AVAIL_IN_WORKLIST_P (bb) = true;
3669 /* No need to insert exit blocks, since their ANTIC_IN is NULL,
3670 and their ANTIC_OUT has already been seeded in. */
3671 if (region->exit_blocks
3672 && !bitmap_bit_p (region->exit_blocks, bb->index))
3674 qlen++;
3675 *qin++ = bb;
3679 /* The exit blocks have been initialized with the local sets. */
3680 if (region->exit_blocks)
3682 unsigned int i;
3683 bitmap_iterator bi;
3684 EXECUTE_IF_SET_IN_BITMAP (region->exit_blocks, 0, i, bi)
3685 BB_VISITED_P (BASIC_BLOCK_FOR_FN (cfun, i)) = true;
3688 qin = worklist;
3689 qend = &worklist[qlen];
3691 /* Iterate until the worklist is empty. */
3692 while (qlen)
3694 /* Take the first entry off the worklist. */
3695 bb = *qout++;
3696 qlen--;
3698 if (qout >= qend)
3699 qout = worklist;
3701 /* This block can be added to the worklist again if necessary. */
3702 AVAIL_IN_WORKLIST_P (bb) = false;
3703 tm_memopt_compute_antin (bb);
3705 /* Note: We do not add the LOCAL sets here because we already
3706 seeded the ANTIC_OUT sets with them. */
3707 if (bitmap_ior_into (STORE_ANTIC_OUT (bb), STORE_ANTIC_IN (bb))
3708 && bb != region->entry_block)
3709 /* If the out state of this block changed, then we need to add
3710 its predecessors to the worklist if they are not already in. */
3711 FOR_EACH_EDGE (e, ei, bb->preds)
3712 if (!AVAIL_IN_WORKLIST_P (e->src))
3714 *qin++ = e->src;
3715 AVAIL_IN_WORKLIST_P (e->src) = true;
3716 qlen++;
3718 if (qin >= qend)
3719 qin = worklist;
3723 free (worklist);
3725 if (dump_file)
3726 dump_tm_memopt_sets (blocks);
3729 /* Offsets of load variants from TM_LOAD. For example,
3730 BUILT_IN_TM_LOAD_RAR* is an offset of 1 from BUILT_IN_TM_LOAD*.
3731 See gtm-builtins.def. */
3732 #define TRANSFORM_RAR 1
3733 #define TRANSFORM_RAW 2
3734 #define TRANSFORM_RFW 3
3735 /* Offsets of store variants from TM_STORE. */
3736 #define TRANSFORM_WAR 1
3737 #define TRANSFORM_WAW 2
3739 /* Inform about a load/store optimization. */
3741 static void
3742 dump_tm_memopt_transform (gimple stmt)
3744 if (dump_file)
3746 fprintf (dump_file, "TM memopt: transforming: ");
3747 print_gimple_stmt (dump_file, stmt, 0, 0);
3748 fprintf (dump_file, "\n");
3752 /* Perform a read/write optimization. Replaces the TM builtin in STMT
3753 by a builtin that is OFFSET entries down in the builtins table in
3754 gtm-builtins.def. */
3756 static void
3757 tm_memopt_transform_stmt (unsigned int offset,
3758 gimple stmt,
3759 gimple_stmt_iterator *gsi)
3761 tree fn = gimple_call_fn (stmt);
3762 gcc_assert (TREE_CODE (fn) == ADDR_EXPR);
3763 TREE_OPERAND (fn, 0)
3764 = builtin_decl_explicit ((enum built_in_function)
3765 (DECL_FUNCTION_CODE (TREE_OPERAND (fn, 0))
3766 + offset));
3767 gimple_call_set_fn (stmt, fn);
3768 gsi_replace (gsi, stmt, true);
3769 dump_tm_memopt_transform (stmt);
3772 /* Perform the actual TM memory optimization transformations in the
3773 basic blocks in BLOCKS. */
3775 static void
3776 tm_memopt_transform_blocks (vec<basic_block> blocks)
3778 size_t i;
3779 basic_block bb;
3780 gimple_stmt_iterator gsi;
3782 for (i = 0; blocks.iterate (i, &bb); ++i)
3784 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
3786 gimple stmt = gsi_stmt (gsi);
3787 bitmap read_avail = READ_AVAIL_IN (bb);
3788 bitmap store_avail = STORE_AVAIL_IN (bb);
3789 bitmap store_antic = STORE_ANTIC_OUT (bb);
3790 unsigned int loc;
3792 if (is_tm_simple_load (stmt))
3794 loc = tm_memopt_value_number (stmt, NO_INSERT);
3795 if (store_avail && bitmap_bit_p (store_avail, loc))
3796 tm_memopt_transform_stmt (TRANSFORM_RAW, stmt, &gsi);
3797 else if (store_antic && bitmap_bit_p (store_antic, loc))
3799 tm_memopt_transform_stmt (TRANSFORM_RFW, stmt, &gsi);
3800 bitmap_set_bit (store_avail, loc);
3802 else if (read_avail && bitmap_bit_p (read_avail, loc))
3803 tm_memopt_transform_stmt (TRANSFORM_RAR, stmt, &gsi);
3804 else
3805 bitmap_set_bit (read_avail, loc);
3807 else if (is_tm_simple_store (stmt))
3809 loc = tm_memopt_value_number (stmt, NO_INSERT);
3810 if (store_avail && bitmap_bit_p (store_avail, loc))
3811 tm_memopt_transform_stmt (TRANSFORM_WAW, stmt, &gsi);
3812 else
3814 if (read_avail && bitmap_bit_p (read_avail, loc))
3815 tm_memopt_transform_stmt (TRANSFORM_WAR, stmt, &gsi);
3816 bitmap_set_bit (store_avail, loc);
3823 /* Return a new set of bitmaps for a BB. */
3825 static struct tm_memopt_bitmaps *
3826 tm_memopt_init_sets (void)
3828 struct tm_memopt_bitmaps *b
3829 = XOBNEW (&tm_memopt_obstack.obstack, struct tm_memopt_bitmaps);
3830 b->store_avail_in = BITMAP_ALLOC (&tm_memopt_obstack);
3831 b->store_avail_out = BITMAP_ALLOC (&tm_memopt_obstack);
3832 b->store_antic_in = BITMAP_ALLOC (&tm_memopt_obstack);
3833 b->store_antic_out = BITMAP_ALLOC (&tm_memopt_obstack);
3834 b->store_avail_out = BITMAP_ALLOC (&tm_memopt_obstack);
3835 b->read_avail_in = BITMAP_ALLOC (&tm_memopt_obstack);
3836 b->read_avail_out = BITMAP_ALLOC (&tm_memopt_obstack);
3837 b->read_local = BITMAP_ALLOC (&tm_memopt_obstack);
3838 b->store_local = BITMAP_ALLOC (&tm_memopt_obstack);
3839 return b;
3842 /* Free sets computed for each BB. */
3844 static void
3845 tm_memopt_free_sets (vec<basic_block> blocks)
3847 size_t i;
3848 basic_block bb;
3850 for (i = 0; blocks.iterate (i, &bb); ++i)
3851 bb->aux = NULL;
3854 /* Clear the visited bit for every basic block in BLOCKS. */
3856 static void
3857 tm_memopt_clear_visited (vec<basic_block> blocks)
3859 size_t i;
3860 basic_block bb;
3862 for (i = 0; blocks.iterate (i, &bb); ++i)
3863 BB_VISITED_P (bb) = false;
3866 /* Replace TM load/stores with hints for the runtime. We handle
3867 things like read-after-write, write-after-read, read-after-read,
3868 read-for-write, etc. */
3870 static unsigned int
3871 execute_tm_memopt (void)
3873 struct tm_region *region;
3874 vec<basic_block> bbs;
3876 tm_memopt_value_id = 0;
3877 tm_memopt_value_numbers.create (10);
3879 for (region = all_tm_regions; region; region = region->next)
3881 /* All the TM stores/loads in the current region. */
3882 size_t i;
3883 basic_block bb;
3885 bitmap_obstack_initialize (&tm_memopt_obstack);
3887 /* Save all BBs for the current region. */
3888 bbs = get_tm_region_blocks (region->entry_block,
3889 region->exit_blocks,
3890 region->irr_blocks,
3891 NULL,
3892 false);
3894 /* Collect all the memory operations. */
3895 for (i = 0; bbs.iterate (i, &bb); ++i)
3897 bb->aux = tm_memopt_init_sets ();
3898 tm_memopt_accumulate_memops (bb);
3901 /* Solve data flow equations and transform each block accordingly. */
3902 tm_memopt_clear_visited (bbs);
3903 tm_memopt_compute_available (region, bbs);
3904 tm_memopt_clear_visited (bbs);
3905 tm_memopt_compute_antic (region, bbs);
3906 tm_memopt_transform_blocks (bbs);
3908 tm_memopt_free_sets (bbs);
3909 bbs.release ();
3910 bitmap_obstack_release (&tm_memopt_obstack);
3911 tm_memopt_value_numbers.empty ();
3914 tm_memopt_value_numbers.dispose ();
3915 return 0;
3918 namespace {
3920 const pass_data pass_data_tm_memopt =
3922 GIMPLE_PASS, /* type */
3923 "tmmemopt", /* name */
3924 OPTGROUP_NONE, /* optinfo_flags */
3925 true, /* has_execute */
3926 TV_TRANS_MEM, /* tv_id */
3927 ( PROP_ssa | PROP_cfg ), /* properties_required */
3928 0, /* properties_provided */
3929 0, /* properties_destroyed */
3930 0, /* todo_flags_start */
3931 0, /* todo_flags_finish */
3934 class pass_tm_memopt : public gimple_opt_pass
3936 public:
3937 pass_tm_memopt (gcc::context *ctxt)
3938 : gimple_opt_pass (pass_data_tm_memopt, ctxt)
3941 /* opt_pass methods: */
3942 virtual bool gate (function *) { return flag_tm && optimize > 0; }
3943 virtual unsigned int execute (function *) { return execute_tm_memopt (); }
3945 }; // class pass_tm_memopt
3947 } // anon namespace
3949 gimple_opt_pass *
3950 make_pass_tm_memopt (gcc::context *ctxt)
3952 return new pass_tm_memopt (ctxt);
3956 /* Interprocedual analysis for the creation of transactional clones.
3957 The aim of this pass is to find which functions are referenced in
3958 a non-irrevocable transaction context, and for those over which
3959 we have control (or user directive), create a version of the
3960 function which uses only the transactional interface to reference
3961 protected memories. This analysis proceeds in several steps:
3963 (1) Collect the set of all possible transactional clones:
3965 (a) For all local public functions marked tm_callable, push
3966 it onto the tm_callee queue.
3968 (b) For all local functions, scan for calls in transaction blocks.
3969 Push the caller and callee onto the tm_caller and tm_callee
3970 queues. Count the number of callers for each callee.
3972 (c) For each local function on the callee list, assume we will
3973 create a transactional clone. Push *all* calls onto the
3974 callee queues; count the number of clone callers separately
3975 to the number of original callers.
3977 (2) Propagate irrevocable status up the dominator tree:
3979 (a) Any external function on the callee list that is not marked
3980 tm_callable is irrevocable. Push all callers of such onto
3981 a worklist.
3983 (b) For each function on the worklist, mark each block that
3984 contains an irrevocable call. Use the AND operator to
3985 propagate that mark up the dominator tree.
3987 (c) If we reach the entry block for a possible transactional
3988 clone, then the transactional clone is irrevocable, and
3989 we should not create the clone after all. Push all
3990 callers onto the worklist.
3992 (d) Place tm_irrevocable calls at the beginning of the relevant
3993 blocks. Special case here is the entry block for the entire
3994 transaction region; there we mark it GTMA_DOES_GO_IRREVOCABLE for
3995 the library to begin the region in serial mode. Decrement
3996 the call count for all callees in the irrevocable region.
3998 (3) Create the transactional clones:
4000 Any tm_callee that still has a non-zero call count is cloned.
4003 /* This structure is stored in the AUX field of each cgraph_node. */
4004 struct tm_ipa_cg_data
4006 /* The clone of the function that got created. */
4007 struct cgraph_node *clone;
4009 /* The tm regions in the normal function. */
4010 struct tm_region *all_tm_regions;
4012 /* The blocks of the normal/clone functions that contain irrevocable
4013 calls, or blocks that are post-dominated by irrevocable calls. */
4014 bitmap irrevocable_blocks_normal;
4015 bitmap irrevocable_blocks_clone;
4017 /* The blocks of the normal function that are involved in transactions. */
4018 bitmap transaction_blocks_normal;
4020 /* The number of callers to the transactional clone of this function
4021 from normal and transactional clones respectively. */
4022 unsigned tm_callers_normal;
4023 unsigned tm_callers_clone;
4025 /* True if all calls to this function's transactional clone
4026 are irrevocable. Also automatically true if the function
4027 has no transactional clone. */
4028 bool is_irrevocable;
4030 /* Flags indicating the presence of this function in various queues. */
4031 bool in_callee_queue;
4032 bool in_worklist;
4034 /* Flags indicating the kind of scan desired while in the worklist. */
4035 bool want_irr_scan_normal;
4038 typedef vec<cgraph_node_ptr> cgraph_node_queue;
4040 /* Return the ipa data associated with NODE, allocating zeroed memory
4041 if necessary. TRAVERSE_ALIASES is true if we must traverse aliases
4042 and set *NODE accordingly. */
4044 static struct tm_ipa_cg_data *
4045 get_cg_data (struct cgraph_node **node, bool traverse_aliases)
4047 struct tm_ipa_cg_data *d;
4049 if (traverse_aliases && (*node)->alias)
4050 *node = cgraph_alias_target (*node);
4052 d = (struct tm_ipa_cg_data *) (*node)->aux;
4054 if (d == NULL)
4056 d = (struct tm_ipa_cg_data *)
4057 obstack_alloc (&tm_obstack.obstack, sizeof (*d));
4058 (*node)->aux = (void *) d;
4059 memset (d, 0, sizeof (*d));
4062 return d;
4065 /* Add NODE to the end of QUEUE, unless IN_QUEUE_P indicates that
4066 it is already present. */
4068 static void
4069 maybe_push_queue (struct cgraph_node *node,
4070 cgraph_node_queue *queue_p, bool *in_queue_p)
4072 if (!*in_queue_p)
4074 *in_queue_p = true;
4075 queue_p->safe_push (node);
4079 /* Duplicate the basic blocks in QUEUE for use in the uninstrumented
4080 code path. QUEUE are the basic blocks inside the transaction
4081 represented in REGION.
4083 Later in split_code_paths() we will add the conditional to choose
4084 between the two alternatives. */
4086 static void
4087 ipa_uninstrument_transaction (struct tm_region *region,
4088 vec<basic_block> queue)
4090 gimple transaction = region->transaction_stmt;
4091 basic_block transaction_bb = gimple_bb (transaction);
4092 int n = queue.length ();
4093 basic_block *new_bbs = XNEWVEC (basic_block, n);
4095 copy_bbs (queue.address (), n, new_bbs, NULL, 0, NULL, NULL, transaction_bb,
4096 true);
4097 edge e = make_edge (transaction_bb, new_bbs[0], EDGE_TM_UNINSTRUMENTED);
4098 add_phi_args_after_copy (new_bbs, n, e);
4100 // Now we will have a GIMPLE_ATOMIC with 3 possible edges out of it.
4101 // a) EDGE_FALLTHRU into the transaction
4102 // b) EDGE_TM_ABORT out of the transaction
4103 // c) EDGE_TM_UNINSTRUMENTED into the uninstrumented blocks.
4105 free (new_bbs);
4108 /* A subroutine of ipa_tm_scan_calls_transaction and ipa_tm_scan_calls_clone.
4109 Queue all callees within block BB. */
4111 static void
4112 ipa_tm_scan_calls_block (cgraph_node_queue *callees_p,
4113 basic_block bb, bool for_clone)
4115 gimple_stmt_iterator gsi;
4117 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4119 gimple stmt = gsi_stmt (gsi);
4120 if (is_gimple_call (stmt) && !is_tm_pure_call (stmt))
4122 tree fndecl = gimple_call_fndecl (stmt);
4123 if (fndecl)
4125 struct tm_ipa_cg_data *d;
4126 unsigned *pcallers;
4127 struct cgraph_node *node;
4129 if (is_tm_ending_fndecl (fndecl))
4130 continue;
4131 if (find_tm_replacement_function (fndecl))
4132 continue;
4134 node = cgraph_get_node (fndecl);
4135 gcc_assert (node != NULL);
4136 d = get_cg_data (&node, true);
4138 pcallers = (for_clone ? &d->tm_callers_clone
4139 : &d->tm_callers_normal);
4140 *pcallers += 1;
4142 maybe_push_queue (node, callees_p, &d->in_callee_queue);
4148 /* Scan all calls in NODE that are within a transaction region,
4149 and push the resulting nodes into the callee queue. */
4151 static void
4152 ipa_tm_scan_calls_transaction (struct tm_ipa_cg_data *d,
4153 cgraph_node_queue *callees_p)
4155 struct tm_region *r;
4157 d->transaction_blocks_normal = BITMAP_ALLOC (&tm_obstack);
4158 d->all_tm_regions = all_tm_regions;
4160 for (r = all_tm_regions; r; r = r->next)
4162 vec<basic_block> bbs;
4163 basic_block bb;
4164 unsigned i;
4166 bbs = get_tm_region_blocks (r->entry_block, r->exit_blocks, NULL,
4167 d->transaction_blocks_normal, false);
4169 // Generate the uninstrumented code path for this transaction.
4170 ipa_uninstrument_transaction (r, bbs);
4172 FOR_EACH_VEC_ELT (bbs, i, bb)
4173 ipa_tm_scan_calls_block (callees_p, bb, false);
4175 bbs.release ();
4178 // ??? copy_bbs should maintain cgraph edges for the blocks as it is
4179 // copying them, rather than forcing us to do this externally.
4180 rebuild_cgraph_edges ();
4182 // ??? In ipa_uninstrument_transaction we don't try to update dominators
4183 // because copy_bbs doesn't return a VEC like iterate_fix_dominators expects.
4184 // Instead, just release dominators here so update_ssa recomputes them.
4185 free_dominance_info (CDI_DOMINATORS);
4187 // When building the uninstrumented code path, copy_bbs will have invoked
4188 // create_new_def_for starting an "ssa update context". There is only one
4189 // instance of this context, so resolve ssa updates before moving on to
4190 // the next function.
4191 update_ssa (TODO_update_ssa);
4194 /* Scan all calls in NODE as if this is the transactional clone,
4195 and push the destinations into the callee queue. */
4197 static void
4198 ipa_tm_scan_calls_clone (struct cgraph_node *node,
4199 cgraph_node_queue *callees_p)
4201 struct function *fn = DECL_STRUCT_FUNCTION (node->decl);
4202 basic_block bb;
4204 FOR_EACH_BB_FN (bb, fn)
4205 ipa_tm_scan_calls_block (callees_p, bb, true);
4208 /* The function NODE has been detected to be irrevocable. Push all
4209 of its callers onto WORKLIST for the purpose of re-scanning them. */
4211 static void
4212 ipa_tm_note_irrevocable (struct cgraph_node *node,
4213 cgraph_node_queue *worklist_p)
4215 struct tm_ipa_cg_data *d = get_cg_data (&node, true);
4216 struct cgraph_edge *e;
4218 d->is_irrevocable = true;
4220 for (e = node->callers; e ; e = e->next_caller)
4222 basic_block bb;
4223 struct cgraph_node *caller;
4225 /* Don't examine recursive calls. */
4226 if (e->caller == node)
4227 continue;
4228 /* Even if we think we can go irrevocable, believe the user
4229 above all. */
4230 if (is_tm_safe_or_pure (e->caller->decl))
4231 continue;
4233 caller = e->caller;
4234 d = get_cg_data (&caller, true);
4236 /* Check if the callee is in a transactional region. If so,
4237 schedule the function for normal re-scan as well. */
4238 bb = gimple_bb (e->call_stmt);
4239 gcc_assert (bb != NULL);
4240 if (d->transaction_blocks_normal
4241 && bitmap_bit_p (d->transaction_blocks_normal, bb->index))
4242 d->want_irr_scan_normal = true;
4244 maybe_push_queue (caller, worklist_p, &d->in_worklist);
4248 /* A subroutine of ipa_tm_scan_irr_blocks; return true iff any statement
4249 within the block is irrevocable. */
4251 static bool
4252 ipa_tm_scan_irr_block (basic_block bb)
4254 gimple_stmt_iterator gsi;
4255 tree fn;
4257 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4259 gimple stmt = gsi_stmt (gsi);
4260 switch (gimple_code (stmt))
4262 case GIMPLE_ASSIGN:
4263 if (gimple_assign_single_p (stmt))
4265 tree lhs = gimple_assign_lhs (stmt);
4266 tree rhs = gimple_assign_rhs1 (stmt);
4267 if (volatile_var_p (lhs) || volatile_var_p (rhs))
4268 return true;
4270 break;
4272 case GIMPLE_CALL:
4274 tree lhs = gimple_call_lhs (stmt);
4275 if (lhs && volatile_var_p (lhs))
4276 return true;
4278 if (is_tm_pure_call (stmt))
4279 break;
4281 fn = gimple_call_fn (stmt);
4283 /* Functions with the attribute are by definition irrevocable. */
4284 if (is_tm_irrevocable (fn))
4285 return true;
4287 /* For direct function calls, go ahead and check for replacement
4288 functions, or transitive irrevocable functions. For indirect
4289 functions, we'll ask the runtime. */
4290 if (TREE_CODE (fn) == ADDR_EXPR)
4292 struct tm_ipa_cg_data *d;
4293 struct cgraph_node *node;
4295 fn = TREE_OPERAND (fn, 0);
4296 if (is_tm_ending_fndecl (fn))
4297 break;
4298 if (find_tm_replacement_function (fn))
4299 break;
4301 node = cgraph_get_node (fn);
4302 d = get_cg_data (&node, true);
4304 /* Return true if irrevocable, but above all, believe
4305 the user. */
4306 if (d->is_irrevocable
4307 && !is_tm_safe_or_pure (fn))
4308 return true;
4310 break;
4313 case GIMPLE_ASM:
4314 /* ??? The Approved Method of indicating that an inline
4315 assembly statement is not relevant to the transaction
4316 is to wrap it in a __tm_waiver block. This is not
4317 yet implemented, so we can't check for it. */
4318 if (is_tm_safe (current_function_decl))
4320 tree t = build1 (NOP_EXPR, void_type_node, size_zero_node);
4321 SET_EXPR_LOCATION (t, gimple_location (stmt));
4322 error ("%Kasm not allowed in %<transaction_safe%> function", t);
4324 return true;
4326 default:
4327 break;
4331 return false;
4334 /* For each of the blocks seeded witin PQUEUE, walk the CFG looking
4335 for new irrevocable blocks, marking them in NEW_IRR. Don't bother
4336 scanning past OLD_IRR or EXIT_BLOCKS. */
4338 static bool
4339 ipa_tm_scan_irr_blocks (vec<basic_block> *pqueue, bitmap new_irr,
4340 bitmap old_irr, bitmap exit_blocks)
4342 bool any_new_irr = false;
4343 edge e;
4344 edge_iterator ei;
4345 bitmap visited_blocks = BITMAP_ALLOC (NULL);
4349 basic_block bb = pqueue->pop ();
4351 /* Don't re-scan blocks we know already are irrevocable. */
4352 if (old_irr && bitmap_bit_p (old_irr, bb->index))
4353 continue;
4355 if (ipa_tm_scan_irr_block (bb))
4357 bitmap_set_bit (new_irr, bb->index);
4358 any_new_irr = true;
4360 else if (exit_blocks == NULL || !bitmap_bit_p (exit_blocks, bb->index))
4362 FOR_EACH_EDGE (e, ei, bb->succs)
4363 if (!bitmap_bit_p (visited_blocks, e->dest->index))
4365 bitmap_set_bit (visited_blocks, e->dest->index);
4366 pqueue->safe_push (e->dest);
4370 while (!pqueue->is_empty ());
4372 BITMAP_FREE (visited_blocks);
4374 return any_new_irr;
4377 /* Propagate the irrevocable property both up and down the dominator tree.
4378 BB is the current block being scanned; EXIT_BLOCKS are the edges of the
4379 TM regions; OLD_IRR are the results of a previous scan of the dominator
4380 tree which has been fully propagated; NEW_IRR is the set of new blocks
4381 which are gaining the irrevocable property during the current scan. */
4383 static void
4384 ipa_tm_propagate_irr (basic_block entry_block, bitmap new_irr,
4385 bitmap old_irr, bitmap exit_blocks)
4387 vec<basic_block> bbs;
4388 bitmap all_region_blocks;
4390 /* If this block is in the old set, no need to rescan. */
4391 if (old_irr && bitmap_bit_p (old_irr, entry_block->index))
4392 return;
4394 all_region_blocks = BITMAP_ALLOC (&tm_obstack);
4395 bbs = get_tm_region_blocks (entry_block, exit_blocks, NULL,
4396 all_region_blocks, false);
4399 basic_block bb = bbs.pop ();
4400 bool this_irr = bitmap_bit_p (new_irr, bb->index);
4401 bool all_son_irr = false;
4402 edge_iterator ei;
4403 edge e;
4405 /* Propagate up. If my children are, I am too, but we must have
4406 at least one child that is. */
4407 if (!this_irr)
4409 FOR_EACH_EDGE (e, ei, bb->succs)
4411 if (!bitmap_bit_p (new_irr, e->dest->index))
4413 all_son_irr = false;
4414 break;
4416 else
4417 all_son_irr = true;
4419 if (all_son_irr)
4421 /* Add block to new_irr if it hasn't already been processed. */
4422 if (!old_irr || !bitmap_bit_p (old_irr, bb->index))
4424 bitmap_set_bit (new_irr, bb->index);
4425 this_irr = true;
4430 /* Propagate down to everyone we immediately dominate. */
4431 if (this_irr)
4433 basic_block son;
4434 for (son = first_dom_son (CDI_DOMINATORS, bb);
4435 son;
4436 son = next_dom_son (CDI_DOMINATORS, son))
4438 /* Make sure block is actually in a TM region, and it
4439 isn't already in old_irr. */
4440 if ((!old_irr || !bitmap_bit_p (old_irr, son->index))
4441 && bitmap_bit_p (all_region_blocks, son->index))
4442 bitmap_set_bit (new_irr, son->index);
4446 while (!bbs.is_empty ());
4448 BITMAP_FREE (all_region_blocks);
4449 bbs.release ();
4452 static void
4453 ipa_tm_decrement_clone_counts (basic_block bb, bool for_clone)
4455 gimple_stmt_iterator gsi;
4457 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4459 gimple stmt = gsi_stmt (gsi);
4460 if (is_gimple_call (stmt) && !is_tm_pure_call (stmt))
4462 tree fndecl = gimple_call_fndecl (stmt);
4463 if (fndecl)
4465 struct tm_ipa_cg_data *d;
4466 unsigned *pcallers;
4467 struct cgraph_node *tnode;
4469 if (is_tm_ending_fndecl (fndecl))
4470 continue;
4471 if (find_tm_replacement_function (fndecl))
4472 continue;
4474 tnode = cgraph_get_node (fndecl);
4475 d = get_cg_data (&tnode, true);
4477 pcallers = (for_clone ? &d->tm_callers_clone
4478 : &d->tm_callers_normal);
4480 gcc_assert (*pcallers > 0);
4481 *pcallers -= 1;
4487 /* (Re-)Scan the transaction blocks in NODE for calls to irrevocable functions,
4488 as well as other irrevocable actions such as inline assembly. Mark all
4489 such blocks as irrevocable and decrement the number of calls to
4490 transactional clones. Return true if, for the transactional clone, the
4491 entire function is irrevocable. */
4493 static bool
4494 ipa_tm_scan_irr_function (struct cgraph_node *node, bool for_clone)
4496 struct tm_ipa_cg_data *d;
4497 bitmap new_irr, old_irr;
4498 bool ret = false;
4500 /* Builtin operators (operator new, and such). */
4501 if (DECL_STRUCT_FUNCTION (node->decl) == NULL
4502 || DECL_STRUCT_FUNCTION (node->decl)->cfg == NULL)
4503 return false;
4505 push_cfun (DECL_STRUCT_FUNCTION (node->decl));
4506 calculate_dominance_info (CDI_DOMINATORS);
4508 d = get_cg_data (&node, true);
4509 auto_vec<basic_block, 10> queue;
4510 new_irr = BITMAP_ALLOC (&tm_obstack);
4512 /* Scan each tm region, propagating irrevocable status through the tree. */
4513 if (for_clone)
4515 old_irr = d->irrevocable_blocks_clone;
4516 queue.quick_push (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
4517 if (ipa_tm_scan_irr_blocks (&queue, new_irr, old_irr, NULL))
4519 ipa_tm_propagate_irr (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)),
4520 new_irr,
4521 old_irr, NULL);
4522 ret = bitmap_bit_p (new_irr,
4523 single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun))->index);
4526 else
4528 struct tm_region *region;
4530 old_irr = d->irrevocable_blocks_normal;
4531 for (region = d->all_tm_regions; region; region = region->next)
4533 queue.quick_push (region->entry_block);
4534 if (ipa_tm_scan_irr_blocks (&queue, new_irr, old_irr,
4535 region->exit_blocks))
4536 ipa_tm_propagate_irr (region->entry_block, new_irr, old_irr,
4537 region->exit_blocks);
4541 /* If we found any new irrevocable blocks, reduce the call count for
4542 transactional clones within the irrevocable blocks. Save the new
4543 set of irrevocable blocks for next time. */
4544 if (!bitmap_empty_p (new_irr))
4546 bitmap_iterator bmi;
4547 unsigned i;
4549 EXECUTE_IF_SET_IN_BITMAP (new_irr, 0, i, bmi)
4550 ipa_tm_decrement_clone_counts (BASIC_BLOCK_FOR_FN (cfun, i),
4551 for_clone);
4553 if (old_irr)
4555 bitmap_ior_into (old_irr, new_irr);
4556 BITMAP_FREE (new_irr);
4558 else if (for_clone)
4559 d->irrevocable_blocks_clone = new_irr;
4560 else
4561 d->irrevocable_blocks_normal = new_irr;
4563 if (dump_file && new_irr)
4565 const char *dname;
4566 bitmap_iterator bmi;
4567 unsigned i;
4569 dname = lang_hooks.decl_printable_name (current_function_decl, 2);
4570 EXECUTE_IF_SET_IN_BITMAP (new_irr, 0, i, bmi)
4571 fprintf (dump_file, "%s: bb %d goes irrevocable\n", dname, i);
4574 else
4575 BITMAP_FREE (new_irr);
4577 pop_cfun ();
4579 return ret;
4582 /* Return true if, for the transactional clone of NODE, any call
4583 may enter irrevocable mode. */
4585 static bool
4586 ipa_tm_mayenterirr_function (struct cgraph_node *node)
4588 struct tm_ipa_cg_data *d;
4589 tree decl;
4590 unsigned flags;
4592 d = get_cg_data (&node, true);
4593 decl = node->decl;
4594 flags = flags_from_decl_or_type (decl);
4596 /* Handle some TM builtins. Ordinarily these aren't actually generated
4597 at this point, but handling these functions when written in by the
4598 user makes it easier to build unit tests. */
4599 if (flags & ECF_TM_BUILTIN)
4600 return false;
4602 /* Filter out all functions that are marked. */
4603 if (flags & ECF_TM_PURE)
4604 return false;
4605 if (is_tm_safe (decl))
4606 return false;
4607 if (is_tm_irrevocable (decl))
4608 return true;
4609 if (is_tm_callable (decl))
4610 return true;
4611 if (find_tm_replacement_function (decl))
4612 return true;
4614 /* If we aren't seeing the final version of the function we don't
4615 know what it will contain at runtime. */
4616 if (cgraph_function_body_availability (node) < AVAIL_AVAILABLE)
4617 return true;
4619 /* If the function must go irrevocable, then of course true. */
4620 if (d->is_irrevocable)
4621 return true;
4623 /* If there are any blocks marked irrevocable, then the function
4624 as a whole may enter irrevocable. */
4625 if (d->irrevocable_blocks_clone)
4626 return true;
4628 /* We may have previously marked this function as tm_may_enter_irr;
4629 see pass_diagnose_tm_blocks. */
4630 if (node->local.tm_may_enter_irr)
4631 return true;
4633 /* Recurse on the main body for aliases. In general, this will
4634 result in one of the bits above being set so that we will not
4635 have to recurse next time. */
4636 if (node->alias)
4637 return ipa_tm_mayenterirr_function (cgraph_get_node (node->thunk.alias));
4639 /* What remains is unmarked local functions without items that force
4640 the function to go irrevocable. */
4641 return false;
4644 /* Diagnose calls from transaction_safe functions to unmarked
4645 functions that are determined to not be safe. */
4647 static void
4648 ipa_tm_diagnose_tm_safe (struct cgraph_node *node)
4650 struct cgraph_edge *e;
4652 for (e = node->callees; e ; e = e->next_callee)
4653 if (!is_tm_callable (e->callee->decl)
4654 && e->callee->local.tm_may_enter_irr)
4655 error_at (gimple_location (e->call_stmt),
4656 "unsafe function call %qD within "
4657 "%<transaction_safe%> function", e->callee->decl);
4660 /* Diagnose call from atomic transactions to unmarked functions
4661 that are determined to not be safe. */
4663 static void
4664 ipa_tm_diagnose_transaction (struct cgraph_node *node,
4665 struct tm_region *all_tm_regions)
4667 struct tm_region *r;
4669 for (r = all_tm_regions; r ; r = r->next)
4670 if (gimple_transaction_subcode (r->transaction_stmt) & GTMA_IS_RELAXED)
4672 /* Atomic transactions can be nested inside relaxed. */
4673 if (r->inner)
4674 ipa_tm_diagnose_transaction (node, r->inner);
4676 else
4678 vec<basic_block> bbs;
4679 gimple_stmt_iterator gsi;
4680 basic_block bb;
4681 size_t i;
4683 bbs = get_tm_region_blocks (r->entry_block, r->exit_blocks,
4684 r->irr_blocks, NULL, false);
4686 for (i = 0; bbs.iterate (i, &bb); ++i)
4687 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
4689 gimple stmt = gsi_stmt (gsi);
4690 tree fndecl;
4692 if (gimple_code (stmt) == GIMPLE_ASM)
4694 error_at (gimple_location (stmt),
4695 "asm not allowed in atomic transaction");
4696 continue;
4699 if (!is_gimple_call (stmt))
4700 continue;
4701 fndecl = gimple_call_fndecl (stmt);
4703 /* Indirect function calls have been diagnosed already. */
4704 if (!fndecl)
4705 continue;
4707 /* Stop at the end of the transaction. */
4708 if (is_tm_ending_fndecl (fndecl))
4710 if (bitmap_bit_p (r->exit_blocks, bb->index))
4711 break;
4712 continue;
4715 /* Marked functions have been diagnosed already. */
4716 if (is_tm_pure_call (stmt))
4717 continue;
4718 if (is_tm_callable (fndecl))
4719 continue;
4721 if (cgraph_local_info (fndecl)->tm_may_enter_irr)
4722 error_at (gimple_location (stmt),
4723 "unsafe function call %qD within "
4724 "atomic transaction", fndecl);
4727 bbs.release ();
4731 /* Return a transactional mangled name for the DECL_ASSEMBLER_NAME in
4732 OLD_DECL. The returned value is a freshly malloced pointer that
4733 should be freed by the caller. */
4735 static tree
4736 tm_mangle (tree old_asm_id)
4738 const char *old_asm_name;
4739 char *tm_name;
4740 void *alloc = NULL;
4741 struct demangle_component *dc;
4742 tree new_asm_id;
4744 /* Determine if the symbol is already a valid C++ mangled name. Do this
4745 even for C, which might be interfacing with C++ code via appropriately
4746 ugly identifiers. */
4747 /* ??? We could probably do just as well checking for "_Z" and be done. */
4748 old_asm_name = IDENTIFIER_POINTER (old_asm_id);
4749 dc = cplus_demangle_v3_components (old_asm_name, DMGL_NO_OPTS, &alloc);
4751 if (dc == NULL)
4753 char length[8];
4755 do_unencoded:
4756 sprintf (length, "%u", IDENTIFIER_LENGTH (old_asm_id));
4757 tm_name = concat ("_ZGTt", length, old_asm_name, NULL);
4759 else
4761 old_asm_name += 2; /* Skip _Z */
4763 switch (dc->type)
4765 case DEMANGLE_COMPONENT_TRANSACTION_CLONE:
4766 case DEMANGLE_COMPONENT_NONTRANSACTION_CLONE:
4767 /* Don't play silly games, you! */
4768 goto do_unencoded;
4770 case DEMANGLE_COMPONENT_HIDDEN_ALIAS:
4771 /* I'd really like to know if we can ever be passed one of
4772 these from the C++ front end. The Logical Thing would
4773 seem that hidden-alias should be outer-most, so that we
4774 get hidden-alias of a transaction-clone and not vice-versa. */
4775 old_asm_name += 2;
4776 break;
4778 default:
4779 break;
4782 tm_name = concat ("_ZGTt", old_asm_name, NULL);
4784 free (alloc);
4786 new_asm_id = get_identifier (tm_name);
4787 free (tm_name);
4789 return new_asm_id;
4792 static inline void
4793 ipa_tm_mark_force_output_node (struct cgraph_node *node)
4795 cgraph_mark_force_output_node (node);
4796 node->analyzed = true;
4799 static inline void
4800 ipa_tm_mark_forced_by_abi_node (struct cgraph_node *node)
4802 node->forced_by_abi = true;
4803 node->analyzed = true;
4806 /* Callback data for ipa_tm_create_version_alias. */
4807 struct create_version_alias_info
4809 struct cgraph_node *old_node;
4810 tree new_decl;
4813 /* A subroutine of ipa_tm_create_version, called via
4814 cgraph_for_node_and_aliases. Create new tm clones for each of
4815 the existing aliases. */
4816 static bool
4817 ipa_tm_create_version_alias (struct cgraph_node *node, void *data)
4819 struct create_version_alias_info *info
4820 = (struct create_version_alias_info *)data;
4821 tree old_decl, new_decl, tm_name;
4822 struct cgraph_node *new_node;
4824 if (!node->cpp_implicit_alias)
4825 return false;
4827 old_decl = node->decl;
4828 tm_name = tm_mangle (DECL_ASSEMBLER_NAME (old_decl));
4829 new_decl = build_decl (DECL_SOURCE_LOCATION (old_decl),
4830 TREE_CODE (old_decl), tm_name,
4831 TREE_TYPE (old_decl));
4833 SET_DECL_ASSEMBLER_NAME (new_decl, tm_name);
4834 SET_DECL_RTL (new_decl, NULL);
4836 /* Based loosely on C++'s make_alias_for(). */
4837 TREE_PUBLIC (new_decl) = TREE_PUBLIC (old_decl);
4838 DECL_CONTEXT (new_decl) = DECL_CONTEXT (old_decl);
4839 DECL_LANG_SPECIFIC (new_decl) = DECL_LANG_SPECIFIC (old_decl);
4840 TREE_READONLY (new_decl) = TREE_READONLY (old_decl);
4841 DECL_EXTERNAL (new_decl) = 0;
4842 DECL_ARTIFICIAL (new_decl) = 1;
4843 TREE_ADDRESSABLE (new_decl) = 1;
4844 TREE_USED (new_decl) = 1;
4845 TREE_SYMBOL_REFERENCED (tm_name) = 1;
4847 /* Perform the same remapping to the comdat group. */
4848 if (DECL_ONE_ONLY (new_decl))
4849 varpool_get_node (new_decl)->set_comdat_group (tm_mangle (decl_comdat_group_id (old_decl)));
4851 new_node = cgraph_same_body_alias (NULL, new_decl, info->new_decl);
4852 new_node->tm_clone = true;
4853 new_node->externally_visible = info->old_node->externally_visible;
4854 /* ?? Do not traverse aliases here. */
4855 get_cg_data (&node, false)->clone = new_node;
4857 record_tm_clone_pair (old_decl, new_decl);
4859 if (info->old_node->force_output
4860 || ipa_ref_list_first_referring (&info->old_node->ref_list))
4861 ipa_tm_mark_force_output_node (new_node);
4862 if (info->old_node->forced_by_abi)
4863 ipa_tm_mark_forced_by_abi_node (new_node);
4864 return false;
4867 /* Create a copy of the function (possibly declaration only) of OLD_NODE,
4868 appropriate for the transactional clone. */
4870 static void
4871 ipa_tm_create_version (struct cgraph_node *old_node)
4873 tree new_decl, old_decl, tm_name;
4874 struct cgraph_node *new_node;
4876 old_decl = old_node->decl;
4877 new_decl = copy_node (old_decl);
4879 /* DECL_ASSEMBLER_NAME needs to be set before we call
4880 cgraph_copy_node_for_versioning below, because cgraph_node will
4881 fill the assembler_name_hash. */
4882 tm_name = tm_mangle (DECL_ASSEMBLER_NAME (old_decl));
4883 SET_DECL_ASSEMBLER_NAME (new_decl, tm_name);
4884 SET_DECL_RTL (new_decl, NULL);
4885 TREE_SYMBOL_REFERENCED (tm_name) = 1;
4887 /* Perform the same remapping to the comdat group. */
4888 if (DECL_ONE_ONLY (new_decl))
4889 varpool_get_node (new_decl)->set_comdat_group (tm_mangle (DECL_COMDAT_GROUP (old_decl)));
4891 gcc_assert (!old_node->ipa_transforms_to_apply.exists ());
4892 new_node = cgraph_copy_node_for_versioning (old_node, new_decl, vNULL, NULL);
4893 new_node->local.local = false;
4894 new_node->externally_visible = old_node->externally_visible;
4895 new_node->lowered = true;
4896 new_node->tm_clone = 1;
4897 get_cg_data (&old_node, true)->clone = new_node;
4899 if (cgraph_function_body_availability (old_node) >= AVAIL_OVERWRITABLE)
4901 /* Remap extern inline to static inline. */
4902 /* ??? Is it worth trying to use make_decl_one_only? */
4903 if (DECL_DECLARED_INLINE_P (new_decl) && DECL_EXTERNAL (new_decl))
4905 DECL_EXTERNAL (new_decl) = 0;
4906 TREE_PUBLIC (new_decl) = 0;
4907 DECL_WEAK (new_decl) = 0;
4910 tree_function_versioning (old_decl, new_decl,
4911 NULL, false, NULL,
4912 false, NULL, NULL);
4915 record_tm_clone_pair (old_decl, new_decl);
4917 cgraph_call_function_insertion_hooks (new_node);
4918 if (old_node->force_output
4919 || ipa_ref_list_first_referring (&old_node->ref_list))
4920 ipa_tm_mark_force_output_node (new_node);
4921 if (old_node->forced_by_abi)
4922 ipa_tm_mark_forced_by_abi_node (new_node);
4924 /* Do the same thing, but for any aliases of the original node. */
4926 struct create_version_alias_info data;
4927 data.old_node = old_node;
4928 data.new_decl = new_decl;
4929 cgraph_for_node_and_aliases (old_node, ipa_tm_create_version_alias,
4930 &data, true);
4934 /* Construct a call to TM_IRREVOCABLE and insert it at the beginning of BB. */
4936 static void
4937 ipa_tm_insert_irr_call (struct cgraph_node *node, struct tm_region *region,
4938 basic_block bb)
4940 gimple_stmt_iterator gsi;
4941 gimple g;
4943 transaction_subcode_ior (region, GTMA_MAY_ENTER_IRREVOCABLE);
4945 g = gimple_build_call (builtin_decl_explicit (BUILT_IN_TM_IRREVOCABLE),
4946 1, build_int_cst (NULL_TREE, MODE_SERIALIRREVOCABLE));
4948 split_block_after_labels (bb);
4949 gsi = gsi_after_labels (bb);
4950 gsi_insert_before (&gsi, g, GSI_SAME_STMT);
4952 cgraph_create_edge (node,
4953 cgraph_get_create_node
4954 (builtin_decl_explicit (BUILT_IN_TM_IRREVOCABLE)),
4955 g, 0,
4956 compute_call_stmt_bb_frequency (node->decl,
4957 gimple_bb (g)));
4960 /* Construct a call to TM_GETTMCLONE and insert it before GSI. */
4962 static bool
4963 ipa_tm_insert_gettmclone_call (struct cgraph_node *node,
4964 struct tm_region *region,
4965 gimple_stmt_iterator *gsi, gimple stmt)
4967 tree gettm_fn, ret, old_fn, callfn;
4968 gimple g, g2;
4969 bool safe;
4971 old_fn = gimple_call_fn (stmt);
4973 if (TREE_CODE (old_fn) == ADDR_EXPR)
4975 tree fndecl = TREE_OPERAND (old_fn, 0);
4976 tree clone = get_tm_clone_pair (fndecl);
4978 /* By transforming the call into a TM_GETTMCLONE, we are
4979 technically taking the address of the original function and
4980 its clone. Explain this so inlining will know this function
4981 is needed. */
4982 cgraph_mark_address_taken_node (cgraph_get_node (fndecl));
4983 if (clone)
4984 cgraph_mark_address_taken_node (cgraph_get_node (clone));
4987 safe = is_tm_safe (TREE_TYPE (old_fn));
4988 gettm_fn = builtin_decl_explicit (safe ? BUILT_IN_TM_GETTMCLONE_SAFE
4989 : BUILT_IN_TM_GETTMCLONE_IRR);
4990 ret = create_tmp_var (ptr_type_node, NULL);
4992 if (!safe)
4993 transaction_subcode_ior (region, GTMA_MAY_ENTER_IRREVOCABLE);
4995 /* Discard OBJ_TYPE_REF, since we weren't able to fold it. */
4996 if (TREE_CODE (old_fn) == OBJ_TYPE_REF)
4997 old_fn = OBJ_TYPE_REF_EXPR (old_fn);
4999 g = gimple_build_call (gettm_fn, 1, old_fn);
5000 ret = make_ssa_name (ret, g);
5001 gimple_call_set_lhs (g, ret);
5003 gsi_insert_before (gsi, g, GSI_SAME_STMT);
5005 cgraph_create_edge (node, cgraph_get_create_node (gettm_fn), g, 0,
5006 compute_call_stmt_bb_frequency (node->decl,
5007 gimple_bb (g)));
5009 /* Cast return value from tm_gettmclone* into appropriate function
5010 pointer. */
5011 callfn = create_tmp_var (TREE_TYPE (old_fn), NULL);
5012 g2 = gimple_build_assign (callfn,
5013 fold_build1 (NOP_EXPR, TREE_TYPE (callfn), ret));
5014 callfn = make_ssa_name (callfn, g2);
5015 gimple_assign_set_lhs (g2, callfn);
5016 gsi_insert_before (gsi, g2, GSI_SAME_STMT);
5018 /* ??? This is a hack to preserve the NOTHROW bit on the call,
5019 which we would have derived from the decl. Failure to save
5020 this bit means we might have to split the basic block. */
5021 if (gimple_call_nothrow_p (stmt))
5022 gimple_call_set_nothrow (stmt, true);
5024 gimple_call_set_fn (stmt, callfn);
5026 /* Discarding OBJ_TYPE_REF above may produce incompatible LHS and RHS
5027 for a call statement. Fix it. */
5029 tree lhs = gimple_call_lhs (stmt);
5030 tree rettype = TREE_TYPE (gimple_call_fntype (stmt));
5031 if (lhs
5032 && !useless_type_conversion_p (TREE_TYPE (lhs), rettype))
5034 tree temp;
5036 temp = create_tmp_reg (rettype, 0);
5037 gimple_call_set_lhs (stmt, temp);
5039 g2 = gimple_build_assign (lhs,
5040 fold_build1 (VIEW_CONVERT_EXPR,
5041 TREE_TYPE (lhs), temp));
5042 gsi_insert_after (gsi, g2, GSI_SAME_STMT);
5046 update_stmt (stmt);
5048 return true;
5051 /* Helper function for ipa_tm_transform_calls*. Given a call
5052 statement in GSI which resides inside transaction REGION, redirect
5053 the call to either its wrapper function, or its clone. */
5055 static void
5056 ipa_tm_transform_calls_redirect (struct cgraph_node *node,
5057 struct tm_region *region,
5058 gimple_stmt_iterator *gsi,
5059 bool *need_ssa_rename_p)
5061 gimple stmt = gsi_stmt (*gsi);
5062 struct cgraph_node *new_node;
5063 struct cgraph_edge *e = cgraph_edge (node, stmt);
5064 tree fndecl = gimple_call_fndecl (stmt);
5066 /* For indirect calls, pass the address through the runtime. */
5067 if (fndecl == NULL)
5069 *need_ssa_rename_p |=
5070 ipa_tm_insert_gettmclone_call (node, region, gsi, stmt);
5071 return;
5074 /* Handle some TM builtins. Ordinarily these aren't actually generated
5075 at this point, but handling these functions when written in by the
5076 user makes it easier to build unit tests. */
5077 if (flags_from_decl_or_type (fndecl) & ECF_TM_BUILTIN)
5078 return;
5080 /* Fixup recursive calls inside clones. */
5081 /* ??? Why did cgraph_copy_node_for_versioning update the call edges
5082 for recursion but not update the call statements themselves? */
5083 if (e->caller == e->callee && decl_is_tm_clone (current_function_decl))
5085 gimple_call_set_fndecl (stmt, current_function_decl);
5086 return;
5089 /* If there is a replacement, use it. */
5090 fndecl = find_tm_replacement_function (fndecl);
5091 if (fndecl)
5093 new_node = cgraph_get_create_node (fndecl);
5095 /* ??? Mark all transaction_wrap functions tm_may_enter_irr.
5097 We can't do this earlier in record_tm_replacement because
5098 cgraph_remove_unreachable_nodes is called before we inject
5099 references to the node. Further, we can't do this in some
5100 nice central place in ipa_tm_execute because we don't have
5101 the exact list of wrapper functions that would be used.
5102 Marking more wrappers than necessary results in the creation
5103 of unnecessary cgraph_nodes, which can cause some of the
5104 other IPA passes to crash.
5106 We do need to mark these nodes so that we get the proper
5107 result in expand_call_tm. */
5108 /* ??? This seems broken. How is it that we're marking the
5109 CALLEE as may_enter_irr? Surely we should be marking the
5110 CALLER. Also note that find_tm_replacement_function also
5111 contains mappings into the TM runtime, e.g. memcpy. These
5112 we know won't go irrevocable. */
5113 new_node->local.tm_may_enter_irr = 1;
5115 else
5117 struct tm_ipa_cg_data *d;
5118 struct cgraph_node *tnode = e->callee;
5120 d = get_cg_data (&tnode, true);
5121 new_node = d->clone;
5123 /* As we've already skipped pure calls and appropriate builtins,
5124 and we've already marked irrevocable blocks, if we can't come
5125 up with a static replacement, then ask the runtime. */
5126 if (new_node == NULL)
5128 *need_ssa_rename_p |=
5129 ipa_tm_insert_gettmclone_call (node, region, gsi, stmt);
5130 return;
5133 fndecl = new_node->decl;
5136 cgraph_redirect_edge_callee (e, new_node);
5137 gimple_call_set_fndecl (stmt, fndecl);
5140 /* Helper function for ipa_tm_transform_calls. For a given BB,
5141 install calls to tm_irrevocable when IRR_BLOCKS are reached,
5142 redirect other calls to the generated transactional clone. */
5144 static bool
5145 ipa_tm_transform_calls_1 (struct cgraph_node *node, struct tm_region *region,
5146 basic_block bb, bitmap irr_blocks)
5148 gimple_stmt_iterator gsi;
5149 bool need_ssa_rename = false;
5151 if (irr_blocks && bitmap_bit_p (irr_blocks, bb->index))
5153 ipa_tm_insert_irr_call (node, region, bb);
5154 return true;
5157 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5159 gimple stmt = gsi_stmt (gsi);
5161 if (!is_gimple_call (stmt))
5162 continue;
5163 if (is_tm_pure_call (stmt))
5164 continue;
5166 /* Redirect edges to the appropriate replacement or clone. */
5167 ipa_tm_transform_calls_redirect (node, region, &gsi, &need_ssa_rename);
5170 return need_ssa_rename;
5173 /* Walk the CFG for REGION, beginning at BB. Install calls to
5174 tm_irrevocable when IRR_BLOCKS are reached, redirect other calls to
5175 the generated transactional clone. */
5177 static bool
5178 ipa_tm_transform_calls (struct cgraph_node *node, struct tm_region *region,
5179 basic_block bb, bitmap irr_blocks)
5181 bool need_ssa_rename = false;
5182 edge e;
5183 edge_iterator ei;
5184 auto_vec<basic_block> queue;
5185 bitmap visited_blocks = BITMAP_ALLOC (NULL);
5187 queue.safe_push (bb);
5190 bb = queue.pop ();
5192 need_ssa_rename |=
5193 ipa_tm_transform_calls_1 (node, region, bb, irr_blocks);
5195 if (irr_blocks && bitmap_bit_p (irr_blocks, bb->index))
5196 continue;
5198 if (region && bitmap_bit_p (region->exit_blocks, bb->index))
5199 continue;
5201 FOR_EACH_EDGE (e, ei, bb->succs)
5202 if (!bitmap_bit_p (visited_blocks, e->dest->index))
5204 bitmap_set_bit (visited_blocks, e->dest->index);
5205 queue.safe_push (e->dest);
5208 while (!queue.is_empty ());
5210 BITMAP_FREE (visited_blocks);
5212 return need_ssa_rename;
5215 /* Transform the calls within the TM regions within NODE. */
5217 static void
5218 ipa_tm_transform_transaction (struct cgraph_node *node)
5220 struct tm_ipa_cg_data *d;
5221 struct tm_region *region;
5222 bool need_ssa_rename = false;
5224 d = get_cg_data (&node, true);
5226 push_cfun (DECL_STRUCT_FUNCTION (node->decl));
5227 calculate_dominance_info (CDI_DOMINATORS);
5229 for (region = d->all_tm_regions; region; region = region->next)
5231 /* If we're sure to go irrevocable, don't transform anything. */
5232 if (d->irrevocable_blocks_normal
5233 && bitmap_bit_p (d->irrevocable_blocks_normal,
5234 region->entry_block->index))
5236 transaction_subcode_ior (region, GTMA_DOES_GO_IRREVOCABLE
5237 | GTMA_MAY_ENTER_IRREVOCABLE
5238 | GTMA_HAS_NO_INSTRUMENTATION);
5239 continue;
5242 need_ssa_rename |=
5243 ipa_tm_transform_calls (node, region, region->entry_block,
5244 d->irrevocable_blocks_normal);
5247 if (need_ssa_rename)
5248 update_ssa (TODO_update_ssa_only_virtuals);
5250 pop_cfun ();
5253 /* Transform the calls within the transactional clone of NODE. */
5255 static void
5256 ipa_tm_transform_clone (struct cgraph_node *node)
5258 struct tm_ipa_cg_data *d;
5259 bool need_ssa_rename;
5261 d = get_cg_data (&node, true);
5263 /* If this function makes no calls and has no irrevocable blocks,
5264 then there's nothing to do. */
5265 /* ??? Remove non-aborting top-level transactions. */
5266 if (!node->callees && !node->indirect_calls && !d->irrevocable_blocks_clone)
5267 return;
5269 push_cfun (DECL_STRUCT_FUNCTION (d->clone->decl));
5270 calculate_dominance_info (CDI_DOMINATORS);
5272 need_ssa_rename =
5273 ipa_tm_transform_calls (d->clone, NULL,
5274 single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)),
5275 d->irrevocable_blocks_clone);
5277 if (need_ssa_rename)
5278 update_ssa (TODO_update_ssa_only_virtuals);
5280 pop_cfun ();
5283 /* Main entry point for the transactional memory IPA pass. */
5285 static unsigned int
5286 ipa_tm_execute (void)
5288 cgraph_node_queue tm_callees = cgraph_node_queue ();
5289 /* List of functions that will go irrevocable. */
5290 cgraph_node_queue irr_worklist = cgraph_node_queue ();
5292 struct cgraph_node *node;
5293 struct tm_ipa_cg_data *d;
5294 enum availability a;
5295 unsigned int i;
5297 #ifdef ENABLE_CHECKING
5298 verify_cgraph ();
5299 #endif
5301 bitmap_obstack_initialize (&tm_obstack);
5302 initialize_original_copy_tables ();
5304 /* For all local functions marked tm_callable, queue them. */
5305 FOR_EACH_DEFINED_FUNCTION (node)
5306 if (is_tm_callable (node->decl)
5307 && cgraph_function_body_availability (node) >= AVAIL_OVERWRITABLE)
5309 d = get_cg_data (&node, true);
5310 maybe_push_queue (node, &tm_callees, &d->in_callee_queue);
5313 /* For all local reachable functions... */
5314 FOR_EACH_DEFINED_FUNCTION (node)
5315 if (node->lowered
5316 && cgraph_function_body_availability (node) >= AVAIL_OVERWRITABLE)
5318 /* ... marked tm_pure, record that fact for the runtime by
5319 indicating that the pure function is its own tm_callable.
5320 No need to do this if the function's address can't be taken. */
5321 if (is_tm_pure (node->decl))
5323 if (!node->local.local)
5324 record_tm_clone_pair (node->decl, node->decl);
5325 continue;
5328 push_cfun (DECL_STRUCT_FUNCTION (node->decl));
5329 calculate_dominance_info (CDI_DOMINATORS);
5331 tm_region_init (NULL);
5332 if (all_tm_regions)
5334 d = get_cg_data (&node, true);
5336 /* Scan for calls that are in each transaction, and
5337 generate the uninstrumented code path. */
5338 ipa_tm_scan_calls_transaction (d, &tm_callees);
5340 /* Put it in the worklist so we can scan the function
5341 later (ipa_tm_scan_irr_function) and mark the
5342 irrevocable blocks. */
5343 maybe_push_queue (node, &irr_worklist, &d->in_worklist);
5344 d->want_irr_scan_normal = true;
5347 pop_cfun ();
5350 /* For every local function on the callee list, scan as if we will be
5351 creating a transactional clone, queueing all new functions we find
5352 along the way. */
5353 for (i = 0; i < tm_callees.length (); ++i)
5355 node = tm_callees[i];
5356 a = cgraph_function_body_availability (node);
5357 d = get_cg_data (&node, true);
5359 /* Put it in the worklist so we can scan the function later
5360 (ipa_tm_scan_irr_function) and mark the irrevocable
5361 blocks. */
5362 maybe_push_queue (node, &irr_worklist, &d->in_worklist);
5364 /* Some callees cannot be arbitrarily cloned. These will always be
5365 irrevocable. Mark these now, so that we need not scan them. */
5366 if (is_tm_irrevocable (node->decl))
5367 ipa_tm_note_irrevocable (node, &irr_worklist);
5368 else if (a <= AVAIL_NOT_AVAILABLE
5369 && !is_tm_safe_or_pure (node->decl))
5370 ipa_tm_note_irrevocable (node, &irr_worklist);
5371 else if (a >= AVAIL_OVERWRITABLE)
5373 if (!tree_versionable_function_p (node->decl))
5374 ipa_tm_note_irrevocable (node, &irr_worklist);
5375 else if (!d->is_irrevocable)
5377 /* If this is an alias, make sure its base is queued as well.
5378 we need not scan the callees now, as the base will do. */
5379 if (node->alias)
5381 node = cgraph_get_node (node->thunk.alias);
5382 d = get_cg_data (&node, true);
5383 maybe_push_queue (node, &tm_callees, &d->in_callee_queue);
5384 continue;
5387 /* Add all nodes called by this function into
5388 tm_callees as well. */
5389 ipa_tm_scan_calls_clone (node, &tm_callees);
5394 /* Iterate scans until no more work to be done. Prefer not to use
5395 vec::pop because the worklist tends to follow a breadth-first
5396 search of the callgraph, which should allow convergance with a
5397 minimum number of scans. But we also don't want the worklist
5398 array to grow without bound, so we shift the array up periodically. */
5399 for (i = 0; i < irr_worklist.length (); ++i)
5401 if (i > 256 && i == irr_worklist.length () / 8)
5403 irr_worklist.block_remove (0, i);
5404 i = 0;
5407 node = irr_worklist[i];
5408 d = get_cg_data (&node, true);
5409 d->in_worklist = false;
5411 if (d->want_irr_scan_normal)
5413 d->want_irr_scan_normal = false;
5414 ipa_tm_scan_irr_function (node, false);
5416 if (d->in_callee_queue && ipa_tm_scan_irr_function (node, true))
5417 ipa_tm_note_irrevocable (node, &irr_worklist);
5420 /* For every function on the callee list, collect the tm_may_enter_irr
5421 bit on the node. */
5422 irr_worklist.truncate (0);
5423 for (i = 0; i < tm_callees.length (); ++i)
5425 node = tm_callees[i];
5426 if (ipa_tm_mayenterirr_function (node))
5428 d = get_cg_data (&node, true);
5429 gcc_assert (d->in_worklist == false);
5430 maybe_push_queue (node, &irr_worklist, &d->in_worklist);
5434 /* Propagate the tm_may_enter_irr bit to callers until stable. */
5435 for (i = 0; i < irr_worklist.length (); ++i)
5437 struct cgraph_node *caller;
5438 struct cgraph_edge *e;
5439 struct ipa_ref *ref;
5440 unsigned j;
5442 if (i > 256 && i == irr_worklist.length () / 8)
5444 irr_worklist.block_remove (0, i);
5445 i = 0;
5448 node = irr_worklist[i];
5449 d = get_cg_data (&node, true);
5450 d->in_worklist = false;
5451 node->local.tm_may_enter_irr = true;
5453 /* Propagate back to normal callers. */
5454 for (e = node->callers; e ; e = e->next_caller)
5456 caller = e->caller;
5457 if (!is_tm_safe_or_pure (caller->decl)
5458 && !caller->local.tm_may_enter_irr)
5460 d = get_cg_data (&caller, true);
5461 maybe_push_queue (caller, &irr_worklist, &d->in_worklist);
5465 /* Propagate back to referring aliases as well. */
5466 for (j = 0; ipa_ref_list_referring_iterate (&node->ref_list, j, ref); j++)
5468 caller = cgraph (ref->referring);
5469 if (ref->use == IPA_REF_ALIAS
5470 && !caller->local.tm_may_enter_irr)
5472 /* ?? Do not traverse aliases here. */
5473 d = get_cg_data (&caller, false);
5474 maybe_push_queue (caller, &irr_worklist, &d->in_worklist);
5479 /* Now validate all tm_safe functions, and all atomic regions in
5480 other functions. */
5481 FOR_EACH_DEFINED_FUNCTION (node)
5482 if (node->lowered
5483 && cgraph_function_body_availability (node) >= AVAIL_OVERWRITABLE)
5485 d = get_cg_data (&node, true);
5486 if (is_tm_safe (node->decl))
5487 ipa_tm_diagnose_tm_safe (node);
5488 else if (d->all_tm_regions)
5489 ipa_tm_diagnose_transaction (node, d->all_tm_regions);
5492 /* Create clones. Do those that are not irrevocable and have a
5493 positive call count. Do those publicly visible functions that
5494 the user directed us to clone. */
5495 for (i = 0; i < tm_callees.length (); ++i)
5497 bool doit = false;
5499 node = tm_callees[i];
5500 if (node->cpp_implicit_alias)
5501 continue;
5503 a = cgraph_function_body_availability (node);
5504 d = get_cg_data (&node, true);
5506 if (a <= AVAIL_NOT_AVAILABLE)
5507 doit = is_tm_callable (node->decl);
5508 else if (a <= AVAIL_AVAILABLE && is_tm_callable (node->decl))
5509 doit = true;
5510 else if (!d->is_irrevocable
5511 && d->tm_callers_normal + d->tm_callers_clone > 0)
5512 doit = true;
5514 if (doit)
5515 ipa_tm_create_version (node);
5518 /* Redirect calls to the new clones, and insert irrevocable marks. */
5519 for (i = 0; i < tm_callees.length (); ++i)
5521 node = tm_callees[i];
5522 if (node->analyzed)
5524 d = get_cg_data (&node, true);
5525 if (d->clone)
5526 ipa_tm_transform_clone (node);
5529 FOR_EACH_DEFINED_FUNCTION (node)
5530 if (node->lowered
5531 && cgraph_function_body_availability (node) >= AVAIL_OVERWRITABLE)
5533 d = get_cg_data (&node, true);
5534 if (d->all_tm_regions)
5535 ipa_tm_transform_transaction (node);
5538 /* Free and clear all data structures. */
5539 tm_callees.release ();
5540 irr_worklist.release ();
5541 bitmap_obstack_release (&tm_obstack);
5542 free_original_copy_tables ();
5544 FOR_EACH_FUNCTION (node)
5545 node->aux = NULL;
5547 #ifdef ENABLE_CHECKING
5548 verify_cgraph ();
5549 #endif
5551 return 0;
5554 namespace {
5556 const pass_data pass_data_ipa_tm =
5558 SIMPLE_IPA_PASS, /* type */
5559 "tmipa", /* name */
5560 OPTGROUP_NONE, /* optinfo_flags */
5561 true, /* has_execute */
5562 TV_TRANS_MEM, /* tv_id */
5563 ( PROP_ssa | PROP_cfg ), /* properties_required */
5564 0, /* properties_provided */
5565 0, /* properties_destroyed */
5566 0, /* todo_flags_start */
5567 0, /* todo_flags_finish */
5570 class pass_ipa_tm : public simple_ipa_opt_pass
5572 public:
5573 pass_ipa_tm (gcc::context *ctxt)
5574 : simple_ipa_opt_pass (pass_data_ipa_tm, ctxt)
5577 /* opt_pass methods: */
5578 virtual bool gate (function *) { return flag_tm; }
5579 virtual unsigned int execute (function *) { return ipa_tm_execute (); }
5581 }; // class pass_ipa_tm
5583 } // anon namespace
5585 simple_ipa_opt_pass *
5586 make_pass_ipa_tm (gcc::context *ctxt)
5588 return new pass_ipa_tm (ctxt);
5591 #include "gt-trans-mem.h"