1 /* Pass for parsing functions with multiple target attributes.
3 Contributed by Evgeny Stupachenko <evstupac@gmail.com>
5 Copyright (C) 2015-2022 Free Software Foundation, Inc.
7 This file is part of GCC.
9 GCC is free software; you can redistribute it and/or modify it under
10 the terms of the GNU General Public License as published by the Free
11 Software Foundation; either version 3, or (at your option) any later version.
14 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
15 WARRANTY; without even the implied warranty of MERCHANTABILITY or
16 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
19 You should have received a copy of the GNU General Public License
20 along with GCC; see the file COPYING3. If not see
21 <http://www.gnu.org/licenses/>. */
25 #include "coretypes.h"
28 #include "stringpool.h"
30 #include "diagnostic-core.h"
31 #include "gimple-ssa.h"
33 #include "tree-pass.h"
36 #include "pretty-print.h"
37 #include "gimple-iterator.h"
38 #include "gimple-walk.h"
39 #include "tree-inline.h"
42 /* Walker callback that replaces all FUNCTION_DECL of a function that's
43 going to be versioned. */
/* OP points at the tree operand currently being visited.  DATA is the
   walk_stmt_info of the walk; its INFO field is read back as the
   cgraph_function_version_info of the function being versioned.  */
46 replace_function_decl (tree
*op
, int *walk_subtrees
, void *data
)
/* Recover the walk state, and from it the version information.  */
48 struct walk_stmt_info
*wi
= (struct walk_stmt_info
*) data
;
49 cgraph_function_version_info
*info
= (cgraph_function_version_info
*)wi
->info
;
/* Only an operand that is a FUNCTION_DECL and is exactly the decl of the
   versioned node is touched.  */
51 if (TREE_CODE (*op
) == FUNCTION_DECL
52 && info
->this_node
->decl
== *op
)
/* Substitute the dispatcher resolver recorded in the version info.  */
54 *op
= info
->dispatcher_resolver
;
61 /* If the call in NODE has multiple target attribute with multiple fields,
62 replace it with dispatcher call and create dispatcher (once). */
/* NODE is the call-graph node whose callers and referrers are pointed at
   the dispatcher below.  */
65 create_dispatcher_calls (struct cgraph_node
*node
)
/* Guard: NODE's decl must be function-versioned and must be the default
   version.  */
69 if (!DECL_FUNCTION_VERSIONED (node
->decl
)
70 || !is_function_default_version (node
->decl
))
/* Diagnose a target that has no ifunc support.  */
73 if (!targetm
.has_ifunc_p ())
75 error_at (DECL_SOURCE_LOCATION (node
->decl
),
76 "the call requires %<ifunc%>, which is not"
77 " supported by this target");
/* Diagnose a target that does not provide the dispatcher hook.  */
80 else if (!targetm
.get_function_versions_dispatcher
)
82 error_at (DECL_SOURCE_LOCATION (node
->decl
),
83 "target does not support function version dispatcher");
/* Ask the target hook for the dispatcher decl of NODE's version set.  */
87 tree idecl
= targetm
.get_function_versions_dispatcher (node
->decl
);
/* NOTE(review): the condition guarding this diagnostic is not visible in
   this extract; presumably it fires when no dispatcher decl was obtained.  */
90 error_at (DECL_SOURCE_LOCATION (node
->decl
),
91 "default %<target_clones%> attribute was not set");
/* Look up the call-graph node of the dispatcher decl.  */
95 cgraph_node
*inode
= cgraph_node::get (idecl
);
/* Let the target generate the dispatcher body; the hook returns the
   resolver decl.  */
97 tree resolver_decl
= targetm
.generate_version_dispatcher_body (inode
);
/* Record the resolver as the dispatcher's alias target and, if the
   dispatcher has not been analyzed yet, resolve the alias to the
   resolver's call-graph node.  */
101 inode
->alias_target
= resolver_decl
;
102 if (!inode
->analyzed
)
103 inode
->resolve_alias (cgraph_node::get (resolver_decl
));
/* Call edges into NODE collected for redirection.  */
105 auto_vec
<cgraph_edge
*> edges_to_redirect
;
106 /* We need to capture the references by value rather than just pointers to them
107 and remove them right away, as removing them later would invalidate what
108 some other reference pointers point to. */
109 auto_vec
<ipa_ref
> references_to_redirect
;
/* Drain NODE's referring list: index 0 is queried each time because the
   reference just copied is removed before the next query.  */
111 while (node
->iterate_referring (0, ref
))
113 references_to_redirect
.safe_push (*ref
);
114 ref
->remove_reference ();
117 /* We need to remember NEXT_CALLER as it could be modified in the loop. */
118 for (cgraph_edge
*e
= node
->callers
; e
; e
= e
->next_caller
)
119 edges_to_redirect
.safe_push (e
);
/* Only proceed when at least one caller edge or reference was collected.  */
121 if (!edges_to_redirect
.is_empty () || !references_to_redirect
.is_empty ())
123 /* Redirect edges. */
/* Each collected edge gets the dispatcher as callee, and its call
   statement is updated to match.  */
126 FOR_EACH_VEC_ELT (edges_to_redirect
, i
, e
)
128 e
->redirect_callee (inode
);
129 cgraph_edge::redirect_call_stmt_to_callee (e
);
132 /* Redirect references. */
133 FOR_EACH_VEC_ELT (references_to_redirect
, i
, ref
)
/* Address references: rewrite the use site so that it names the
   dispatcher resolver instead of NODE's decl.  */
135 if (ref
->use
== IPA_REF_ADDR
)
/* Zero-initialized walk state whose INFO carries NODE's version info,
   as expected by replace_function_decl.  */
137 struct walk_stmt_info wi
;
138 memset (&wi
, 0, sizeof (wi
));
139 wi
.info
= (void *)node
->function_version ();
/* A referring variable: walk its DECL_INITIAL tree, using a visited set
   for the walk.  */
141 if (dyn_cast
<varpool_node
*> (ref
->referring
))
143 hash_set
<tree
> visited_nodes
;
144 walk_tree (&DECL_INITIAL (ref
->referring
->decl
),
145 replace_function_decl
, &wi
, &visited_nodes
);
/* Statement-level rewrite of the referencing gimple statement; it is
   skipped when the referrer is the resolver itself.  */
149 gimple_stmt_iterator it
= gsi_for_stmt (ref
->stmt
);
150 if (ref
->referring
->decl
!= resolver_decl
)
151 walk_gimple_stmt (&it
, NULL
, replace_function_decl
, &wi
);
/* Re-create the address reference, now from the referrer to the
   dispatcher.  */
154 symtab_node
*source
= ref
->referring
;
155 source
->create_reference (inode
, IPA_REF_ADDR
);
/* Alias references: re-create the reference against the dispatcher and
   put the referrer into the dispatcher's comdat group when it has one.  */
157 else if (ref
->use
== IPA_REF_ALIAS
)
159 symtab_node
*source
= ref
->referring
;
160 source
->create_reference (inode
, IPA_REF_ALIAS
);
161 if (inode
->get_comdat_group ())
162 source
->add_to_same_comdat_group (inode
);
/* Give NODE's decl a new assembler name built with the "default" clone
   suffix.  */
169 tree fname
= clone_function_name (node
->decl
, "default");
170 symtab
->change_decl_assembler_name (node
->decl
, fname
);
/* The statements that follow are conditional on NODE being a
   definition.  */
172 if (node
->definition
)
174 /* FIXME: copy of cgraph_node::make_local that should be cleaned up
176 node
->make_decl_local ();
177 node
->set_section (NULL
);
178 node
->set_comdat_group (NULL
);
179 node
->externally_visible
= false;
180 node
->forced_by_abi
= false;
181 node
->set_section (NULL
);
183 DECL_ARTIFICIAL (node
->decl
) = 1;
184 node
->force_output
= true;
188 /* Create string with attributes separated by comma.
189 Return number of attributes. */
/* ARGLIST is walked through TREE_CHAIN and the string constant held in
   each entry's TREE_VALUE is copied into ATTR_STR, the caller-supplied
   output buffer.  */
192 get_attr_str (tree arglist
, char *attr_str
)
/* Write offset into ATTR_STR.  */
195 size_t str_len_sum
= 0;
198 for (arg
= arglist
; arg
; arg
= TREE_CHAIN (arg
))
200 const char *str
= TREE_STRING_POINTER (TREE_VALUE (arg
));
201 size_t len
= strlen (str
);
/* Visit every ',' embedded in STR.  NOTE(review): the loop body is not
   visible in this extract; presumably it counts the extra attributes a
   single string contains.  */
202 for (const char *p
= strchr (str
, ','); p
; p
= strchr (p
+ 1, ','))
/* Append STR at the current offset, followed by ',' when more list
   entries remain or by the terminating NUL after the last entry.  */
204 memcpy (attr_str
+ str_len_sum
, str
, len
);
205 attr_str
[str_len_sum
+ len
] = TREE_CHAIN (arg
) ? ',' : '\0';
/* Step over the copied text and its one-character separator.  */
206 str_len_sum
+= len
+ 1;
/* Split the comma-separated ATTR_STR in place and store a pointer to each
   attribute other than "default" into ATTRS.  ATTRNUM is the number of
   attributes the caller expects ATTR_STR to contain.

   ATTR_STR is modified by strtok and the pointers stored in ATTRS point
   into it, so it must outlive ATTRS.  ATTRS must have room for ATTRNUM
   entries.

   Return the number of attributes stored in ATTRS.
   If there is no DEFAULT attribute return -1.
   If there is an empty string in attribute return -2.
   If there are multiple DEFAULT attributes return -3.  */

static int
separate_attrs (char *attr_str, char **attrs, int attrnum)
{
  int i = 0;
  int default_count = 0;

  for (char *attr = strtok (attr_str, ",");
       attr != NULL; attr = strtok (NULL, ","))
    {
      /* "default" is only counted; it is never stored in ATTRS.  */
      if (strcmp (attr, "default") == 0)
        {
          default_count++;
          continue;
        }
      attrs[i++] = attr;
    }

  if (default_count == 0)
    return -1;
  else if (default_count > 1)
    return -3;
  /* strtok skips empty fields, so seeing fewer tokens than ATTRNUM means
     that ATTR_STR contained an empty attribute.  */
  else if (i + default_count < attrnum)
    return -2;

  return i;
}
/* Return true if symbol is valid in assembler name.  The accepted
   characters are the ASCII letters, the decimal digits and '_'.  */

static bool
is_valid_asm_symbol (char c)
{
  if ('a' <= c && c <= 'z')
    return true;
  if ('A' <= c && c <= 'Z')
    return true;
  if ('0' <= c && c <= '9')
    return true;
  /* '_' is the character invalid symbols are replaced with, so it has to
     be accepted itself.  */
  if (c == '_')
    return true;
  return false;
}
260 /* Replace all not valid assembler symbols with '_'. */
263 create_new_asm_name (char *old_asm_name
, char *new_asm_name
)
266 int old_name_len
= strlen (old_asm_name
);
268 /* Replace all not valid assembler symbols with '_'. */
269 for (i
= 0; i
< old_name_len
; i
++)
270 if (!is_valid_asm_symbol (old_asm_name
[i
]))
271 new_asm_name
[i
] = '_';
273 new_asm_name
[i
] = old_asm_name
[i
];
274 new_asm_name
[old_name_len
] = '\0';
277 /* Creates target clone of NODE. */
/* NAME is used as the clone-name suffix.  The ATTRIBUTES value used below
   is handed to the clone as its attribute list.  */
280 create_target_clone (cgraph_node
*node
, bool definition
, char *name
,
283 cgraph_node
*new_node
;
/* Path that clones NODE together with its body, passing NAME and
   ATTRIBUTES to the cloning routine.  NOTE(review): the branch condition
   is not visible in this extract; presumably it is selected by
   DEFINITION.  */
288 = node
->create_version_clone_with_body (vNULL
, NULL
, NULL
, NULL
, NULL
,
289 name
, attributes
, false);
/* A NULL result from the cloning routine is checked before the clone is
   used.  */
290 if (new_node
== NULL
)
292 new_node
->force_output
= true;
/* Path that only duplicates the declaration: copy NODE's decl, get or
   create the call-graph node for the copy and attach ATTRIBUTES to it.  */
296 tree new_decl
= copy_node (node
->decl
);
297 new_node
= cgraph_node::get_create (new_decl
);
298 DECL_ATTRIBUTES (new_decl
) = attributes
;
299 /* Generate a new name for the new version. */
300 tree fname
= clone_function_name (node
->decl
, name
);
301 symtab
->change_decl_assembler_name (new_node
->decl
, fname
);
306 /* If the function in NODE has multiple target attributes
307 create the appropriate clone for each valid target attribute. */
/* DEFINITION is forwarded to create_target_clone for every clone.  */
310 expand_target_clones (struct cgraph_node
*node
, bool definition
)
313 /* Parsing target attributes separated by comma. */
314 tree attr_target
= lookup_attribute ("target_clones",
315 DECL_ATTRIBUTES (node
->decl
));
316 /* No targets specified. */
/* The attribute's argument list, and the buffer length that
   get_target_clone_attr_len reports for it.  */
320 tree arglist
= TREE_VALUE (attr_target
);
321 int attr_len
= get_target_clone_attr_len (arglist
);
323 /* No need to clone for 1 target attribute. */
326 warning_at (DECL_SOURCE_LOCATION (node
->decl
),
327 0, "single %<target_clones%> attribute is ignored");
/* Cloning is refused for aliases and for functions that
   tree_versionable_function_p rejects.  The error is followed by a note
   explaining the reason, both issued under one diagnostic group.  */
332 && (node
->alias
|| !tree_versionable_function_p (node
->decl
)))
334 auto_diagnostic_group d
;
335 error_at (DECL_SOURCE_LOCATION (node
->decl
),
336 "clones for %<target_clones%> attribute cannot be created");
/* Pick the explanation: an explicit noclone attribute, an alias, or
   otherwise whatever copy_forbidden reports for the function.  */
337 const char *reason
= NULL
;
338 if (lookup_attribute ("noclone", DECL_ATTRIBUTES (node
->decl
)))
339 reason
= G_("function %q+F can never be copied "
340 "because it has %<noclone%> attribute");
341 else if (node
->alias
)
343 = "%<target_clones%> cannot be combined with %<alias%> attribute";
345 reason
= copy_forbidden (DECL_STRUCT_FUNCTION (node
->decl
));
347 inform (DECL_SOURCE_LOCATION (node
->decl
), reason
, node
->decl
);
/* Flatten the argument list into a freshly allocated buffer of ATTR_LEN
   characters, then allocate one pointer slot per attribute counted by
   get_attr_str.  */
351 char *attr_str
= XNEWVEC (char, attr_len
);
352 int attrnum
= get_attr_str (arglist
, attr_str
);
353 char **attrs
= XNEWVEC (char *, attrnum
);
/* Split the buffer into individual attributes; ATTRNUM is replaced by the
   result of separate_attrs.  */
355 attrnum
= separate_attrs (attr_str
, attrs
, attrnum
);
/* Diagnostics for the failure results of separate_attrs.  NOTE(review):
   the conditions selecting each message are not visible in this
   extract.  */
359 error_at (DECL_SOURCE_LOCATION (node
->decl
),
360 "%<default%> target was not set");
363 error_at (DECL_SOURCE_LOCATION (node
->decl
),
364 "an empty string cannot be in %<target_clones%> attribute");
367 error_at (DECL_SOURCE_LOCATION (node
->decl
),
368 "multiple %<default%> targets were set");
/* Release the flattened attribute buffer.  */
377 XDELETEVEC (attr_str
);
/* DECL1_V is the version info of NODE, DECL2_V that of each clone; BEFORE
   and AFTER are used to splice the two version chains together.  */
381 cgraph_function_version_info
*decl1_v
= NULL
;
382 cgraph_function_version_info
*decl2_v
= NULL
;
383 cgraph_function_version_info
*before
= NULL
;
384 cgraph_function_version_info
*after
= NULL
;
/* Fetch NODE's version info; a new record can be inserted for it.  */
385 decl1_v
= node
->function_version ();
387 decl1_v
= node
->insert_new_function_version ();
/* Mark NODE's decl as function-versioned.  */
389 DECL_FUNCTION_VERSIONED (node
->decl
) = 1;
/* One clone per attribute stored in ATTRS.  */
391 for (i
= 0; i
< attrnum
; i
++)
393 char *attr
= attrs
[i
];
/* The suffix buffer holds the attribute text plus its terminating NUL;
   create_new_asm_name fills it from ATTR.  */
394 char *suffix
= XNEWVEC (char, strlen (attr
) + 1);
396 create_new_asm_name (attr
, suffix
);
397 /* Create new target clone. */
/* The clone's attribute list is NODE's list extended with a "target"
   attribute whose value is ATTR.  */
398 tree attributes
= make_attribute ("target", attr
,
399 DECL_ATTRIBUTES (node
->decl
));
401 cgraph_node
*new_node
= create_target_clone (node
, definition
, suffix
,
/* A NULL clone is checked before the clone is used.  */
403 if (new_node
== NULL
)
405 new_node
->local
= false;
/* Fetch the clone's version info; a new record can be inserted for it.  */
408 decl2_v
= new_node
->function_version ();
411 decl2_v
= new_node
->insert_new_function_version ();
413 /* Chain decl2_v and decl1_v. All semantically identical versions
414 will be chained together. */
/* Move BEFORE forward to the last element of its chain and AFTER back
   towards the first element of its chain, then link the two.  */
416 while (before
->next
!= NULL
)
417 before
= before
->next
;
418 while (after
->prev
!= NULL
)
421 before
->next
= after
;
422 after
->prev
= before
;
/* Mark the clone's decl as function-versioned.  */
423 DECL_FUNCTION_VERSIONED (new_node
->decl
) = 1;
/* Release the flattened attribute buffer.  */
427 XDELETEVEC (attr_str
);
429 /* Setting new attribute to initial function. */
/* NODE itself receives a "target" attribute with the value "default".  */
430 tree attributes
= make_attribute ("target", "default",
431 DECL_ATTRIBUTES (node
->decl
));
432 DECL_ATTRIBUTES (node
->decl
) = attributes
;
437 /* When NODE is a target clone, consider all callees and redirect
438 to a clone with equal target attributes. That prevents multiple
439 multi-versioning dispatches and a call-chain can be optimized. */
442 redirect_to_specific_clone (cgraph_node
*node
)
/* Version info of NODE.  */
444 cgraph_function_version_info
*fv
= node
->function_version ();
/* The "target" attribute of NODE is what callee versions are compared
   against; its absence is checked first.  */
448 tree attr_target
= lookup_attribute ("target", DECL_ATTRIBUTES (node
->decl
));
449 if (attr_target
== NULL_TREE
)
452 /* We need to remember NEXT_CALLER as it could be modified in the loop. */
/* Walk the outgoing call edges of NODE.  */
453 for (cgraph_edge
*e
= node
->callees
; e
; e
= e
->next_callee
)
/* Version info and "target" attribute of the current callee.  */
455 cgraph_function_version_info
*fv2
= e
->callee
->function_version ();
459 tree attr_target2
= lookup_attribute ("target",
460 DECL_ATTRIBUTES (e
->callee
->decl
));
462 /* Function is not calling proper target clone. */
463 if (attr_target2
== NULL_TREE
464 || !attribute_value_equal (attr_target
, attr_target2
))
/* Rewind to the first element of the callee's version chain so that the
   search below covers every version.  */
466 while (fv2
->prev
!= NULL
)
469 /* Try to find a clone with equal target attribute. */
470 for (; fv2
!= NULL
; fv2
= fv2
->next
)
472 cgraph_node
*callee
= fv2
->this_node
;
473 attr_target2
= lookup_attribute ("target",
474 DECL_ATTRIBUTES (callee
->decl
));
/* A version whose "target" attribute value equals NODE's becomes the new
   callee of the edge, and the call statement is updated to match.  */
475 if (attr_target2
!= NULL_TREE
476 && attribute_value_equal (attr_target
, attr_target2
))
478 e
->redirect_callee (callee
);
479 cgraph_edge::redirect_call_stmt_to_callee (e
);
/* Driver of the pass.  It runs three phases over the functions of the
   unit: expand target clones, create dispatcher calls, then redirect
   callees to matching clones.  */
488 ipa_target_clone (void)
490 struct cgraph_node
*node
;
/* Nodes for which expand_target_clones reported success.  */
491 auto_vec
<cgraph_node
*> to_dispatch
;
/* Phase 1: expand clones for every function, passing along whether the
   node is a definition, and remember the nodes that were expanded.  */
493 FOR_EACH_FUNCTION (node
)
494 if (expand_target_clones (node
, node
->definition
))
495 to_dispatch
.safe_push (node
);
/* Phase 2: create the dispatcher calls for every remembered node.  */
497 for (unsigned i
= 0; i
< to_dispatch
.length (); i
++)
498 create_dispatcher_calls (to_dispatch
[i
]);
/* Phase 3: for every function, redirect its callees to the clone with an
   equal target attribute.  */
500 FOR_EACH_FUNCTION (node
)
501 redirect_to_specific_clone (node
);
/* Static description of the pass: a simple IPA pass named "targetclone"
   that requires the SSA and CFG properties, provides and destroys none,
   and requests an SSA update when it finishes.  */
508 const pass_data pass_data_target_clone
=
510 SIMPLE_IPA_PASS
, /* type */
511 "targetclone", /* name */
512 OPTGROUP_NONE
, /* optinfo_flags */
514 ( PROP_ssa
| PROP_cfg
), /* properties_required */
515 0, /* properties_provided */
516 0, /* properties_destroyed */
517 0, /* todo_flags_start */
518 TODO_update_ssa
/* todo_flags_finish */
/* Pass object for the target-clone pass.  It is a simple_ipa_opt_pass
   constructed from pass_data_target_clone.  */
521 class pass_target_clone
: public simple_ipa_opt_pass
/* CTXT is forwarded to the base class together with the pass
   description.  */
524 pass_target_clone (gcc::context
*ctxt
)
525 : simple_ipa_opt_pass (pass_data_target_clone
, ctxt
)
528 /* opt_pass methods: */
/* The gate is only declared here and is defined out of line.  */
529 bool gate (function
*) final override
;
/* Executing the pass runs ipa_target_clone and returns its result; the
   function argument is unused.  */
530 unsigned int execute (function
*) final override
532 return ipa_target_clone ();
/* Out-of-line definition of the gate declared in pass_target_clone; the
   function argument is unnamed.  NOTE(review): the body is not visible in
   this extract.  */
537 pass_target_clone::gate (function
*)
/* Factory for the pass: allocate a new pass_target_clone for CTXT and
   return it as a simple_ipa_opt_pass pointer.  */
544 simple_ipa_opt_pass
*
545 make_pass_target_clone (gcc::context
*ctxt
)
547 return new pass_target_clone (ctxt
);