2018-06-09 Steven G. Kargl <kargl@gcc.gnu.org>
[official-gcc.git] / gcc / fortran / frontend-passes.c
blobc13366cf138276fc3817d1a38b5ea1d6930954a9
1 /* Pass manager for Fortran front end.
2 Copyright (C) 2010-2018 Free Software Foundation, Inc.
3 Contributed by Thomas König.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
21 #include "config.h"
22 #include "system.h"
23 #include "coretypes.h"
24 #include "options.h"
25 #include "gfortran.h"
26 #include "dependency.h"
27 #include "constructor.h"
28 #include "intrinsic.h"
30 /* Forward declarations. */
32 static void strip_function_call (gfc_expr *);
33 static void optimize_namespace (gfc_namespace *);
34 static void optimize_assignment (gfc_code *);
35 static bool optimize_op (gfc_expr *);
36 static bool optimize_comparison (gfc_expr *, gfc_intrinsic_op);
37 static bool optimize_trim (gfc_expr *);
38 static bool optimize_lexical_comparison (gfc_expr *);
39 static void optimize_minmaxloc (gfc_expr **);
40 static bool is_empty_string (gfc_expr *e);
41 static void doloop_warn (gfc_namespace *);
42 static int do_intent (gfc_expr **);
43 static int do_subscript (gfc_expr **);
44 static void optimize_reduction (gfc_namespace *);
45 static int callback_reduction (gfc_expr **, int *, void *);
46 static void realloc_strings (gfc_namespace *);
47 static gfc_expr *create_var (gfc_expr *, const char *vname=NULL);
48 static int matmul_to_var_expr (gfc_expr **, int *, void *);
49 static int matmul_to_var_code (gfc_code **, int *, void *);
50 static int inline_matmul_assign (gfc_code **, int *, void *);
51 static gfc_code * create_do_loop (gfc_expr *, gfc_expr *, gfc_expr *,
52 locus *, gfc_namespace *,
53 char *vname=NULL);
54 static gfc_expr* check_conjg_transpose_variable (gfc_expr *, bool *,
55 bool *);
56 static bool has_dimen_vector_ref (gfc_expr *);
57 static int matmul_temp_args (gfc_code **, int *,void *data);
58 static int index_interchange (gfc_code **, int*, void *);
60 static bool is_fe_temp (gfc_expr *e);
62 #ifdef CHECKING_P
63 static void check_locus (gfc_namespace *);
64 #endif
66 /* How deep we are inside an argument list. */
68 static int count_arglist;
70 /* Vector of gfc_expr ** we operate on. */
72 static vec<gfc_expr **> expr_array;
74 /* Pointer to the gfc_code we currently work on - to be able to insert
75 a block before the statement. */
77 static gfc_code **current_code;
79 /* Pointer to the block to be inserted, and the statement we are
80 changing within the block. */
82 static gfc_code *inserted_block, **changed_statement;
84 /* The namespace we are currently dealing with. */
86 static gfc_namespace *current_ns;
88 /* If we are within any forall loop. */
90 static int forall_level;
92 /* Keep track of whether we are within an OMP workshare. */
94 static bool in_omp_workshare;
96 /* Keep track of whether we are within a WHERE statement. */
98 static bool in_where;
100 /* Keep track of iterators for array constructors. */
102 static int iterator_level;
104 /* Keep track of DO loop levels. */
106 typedef struct {
107 gfc_code *c;
108 int branch_level;
109 bool seen_goto;
110 } do_t;
112 static vec<do_t> doloop_list;
113 static int doloop_level;
115 /* Keep track of if and select case levels. */
117 static int if_level;
118 static int select_level;
120 /* Vector of gfc_expr * to keep track of DO loops. */
122 struct my_struct *evec;
124 /* Keep track of association lists. */
126 static bool in_assoc_list;
128 /* Counter for temporary variables. */
130 static int var_num = 1;
132 /* What sort of matrix we are dealing with when inlining MATMUL. */
134 enum matrix_case { none=0, A2B2, A2B1, A1B2, A2B2T, A2TB2 };
136 /* Keep track of the number of expressions we have inserted so far
137 using create_var. */
139 int n_vars;
141 /* Entry point - run all passes for a namespace. */
143 void
144 gfc_run_passes (gfc_namespace *ns)
147 /* Warn about dubious DO loops where the index might
148 change. */
150 doloop_level = 0;
151 if_level = 0;
152 select_level = 0;
153 doloop_warn (ns);
154 doloop_list.release ();
155 int w, e;
157 #ifdef CHECKING_P
158 check_locus (ns);
159 #endif
161 gfc_get_errors (&w, &e);
162 if (e > 0)
163 return;
165 if (flag_frontend_optimize || flag_frontend_loop_interchange)
166 optimize_namespace (ns);
168 if (flag_frontend_optimize)
170 optimize_reduction (ns);
171 if (flag_dump_fortran_optimized)
172 gfc_dump_parse_tree (ns, stdout);
174 expr_array.release ();
177 if (flag_realloc_lhs)
178 realloc_strings (ns);
181 #ifdef CHECKING_P
183 /* Callback function: Warn if there is no location information in a
184 statement. */
186 static int
187 check_locus_code (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
188 void *data ATTRIBUTE_UNUSED)
190 current_code = c;
191 if (c && *c && (((*c)->loc.nextc == NULL) || ((*c)->loc.lb == NULL)))
192 gfc_warning_internal (0, "No location in statement");
194 return 0;
198 /* Callback function: Warn if there is no location information in an
199 expression. */
201 static int
202 check_locus_expr (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
203 void *data ATTRIBUTE_UNUSED)
206 if (e && *e && (((*e)->where.nextc == NULL || (*e)->where.lb == NULL)))
207 gfc_warning_internal (0, "No location in expression near %L",
208 &((*current_code)->loc));
209 return 0;
212 /* Run check for missing location information. */
214 static void
215 check_locus (gfc_namespace *ns)
217 gfc_code_walker (&ns->code, check_locus_code, check_locus_expr, NULL);
219 for (ns = ns->contained; ns; ns = ns->sibling)
221 if (ns->code == NULL || ns->code->op != EXEC_BLOCK)
222 check_locus (ns);
226 #endif
228 /* Callback for each gfc_code node invoked from check_realloc_strings.
229 For an allocatable LHS string which also appears as a variable on
230 the RHS, replace
232 a = a(x:y)
234 with
236 tmp = a(x:y)
237 a = tmp
240 static int
241 realloc_string_callback (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
242 void *data ATTRIBUTE_UNUSED)
244 gfc_expr *expr1, *expr2;
245 gfc_code *co = *c;
246 gfc_expr *n;
247 gfc_ref *ref;
248 bool found_substr;
250 if (co->op != EXEC_ASSIGN)
251 return 0;
253 expr1 = co->expr1;
254 if (expr1->ts.type != BT_CHARACTER
255 || !gfc_expr_attr(expr1).allocatable
256 || !expr1->ts.deferred)
257 return 0;
259 if (is_fe_temp (expr1))
260 return 0;
262 expr2 = gfc_discard_nops (co->expr2);
264 if (expr2->expr_type == EXPR_VARIABLE)
266 found_substr = false;
267 for (ref = expr2->ref; ref; ref = ref->next)
269 if (ref->type == REF_SUBSTRING)
271 found_substr = true;
272 break;
275 if (!found_substr)
276 return 0;
278 else if (expr2->expr_type != EXPR_ARRAY
279 && (expr2->expr_type != EXPR_OP
280 || expr2->value.op.op != INTRINSIC_CONCAT))
281 return 0;
283 if (!gfc_check_dependency (expr1, expr2, true))
284 return 0;
286 /* gfc_check_dependency doesn't always pick up identical expressions.
287 However, eliminating the above sends the compiler into an infinite
288 loop on valid expressions. Without this check, the gimplifier emits
289 an ICE for a = a, where a is deferred character length. */
290 if (!gfc_dep_compare_expr (expr1, expr2))
291 return 0;
293 current_code = c;
294 inserted_block = NULL;
295 changed_statement = NULL;
296 n = create_var (expr2, "realloc_string");
297 co->expr2 = n;
298 return 0;
301 /* Callback for each gfc_code node invoked through gfc_code_walker
302 from optimize_namespace. */
304 static int
305 optimize_code (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
306 void *data ATTRIBUTE_UNUSED)
309 gfc_exec_op op;
311 op = (*c)->op;
313 if (op == EXEC_CALL || op == EXEC_COMPCALL || op == EXEC_ASSIGN_CALL
314 || op == EXEC_CALL_PPC)
315 count_arglist = 1;
316 else
317 count_arglist = 0;
319 current_code = c;
320 inserted_block = NULL;
321 changed_statement = NULL;
323 if (op == EXEC_ASSIGN)
324 optimize_assignment (*c);
325 return 0;
328 /* Callback for each gfc_expr node invoked through gfc_code_walker
329 from optimize_namespace. */
331 static int
332 optimize_expr (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
333 void *data ATTRIBUTE_UNUSED)
335 bool function_expr;
337 if ((*e)->expr_type == EXPR_FUNCTION)
339 count_arglist ++;
340 function_expr = true;
342 else
343 function_expr = false;
345 if (optimize_trim (*e))
346 gfc_simplify_expr (*e, 0);
348 if (optimize_lexical_comparison (*e))
349 gfc_simplify_expr (*e, 0);
351 if ((*e)->expr_type == EXPR_OP && optimize_op (*e))
352 gfc_simplify_expr (*e, 0);
354 if ((*e)->expr_type == EXPR_FUNCTION && (*e)->value.function.isym)
355 switch ((*e)->value.function.isym->id)
357 case GFC_ISYM_MINLOC:
358 case GFC_ISYM_MAXLOC:
359 optimize_minmaxloc (e);
360 break;
361 default:
362 break;
365 if (function_expr)
366 count_arglist --;
368 return 0;
371 /* Auxiliary function to handle the arguments to reduction intrnisics. If the
372 function is a scalar, just copy it; otherwise returns the new element, the
373 old one can be freed. */
375 static gfc_expr *
376 copy_walk_reduction_arg (gfc_constructor *c, gfc_expr *fn)
378 gfc_expr *fcn, *e = c->expr;
380 fcn = gfc_copy_expr (e);
381 if (c->iterator)
383 gfc_constructor_base newbase;
384 gfc_expr *new_expr;
385 gfc_constructor *new_c;
387 newbase = NULL;
388 new_expr = gfc_get_expr ();
389 new_expr->expr_type = EXPR_ARRAY;
390 new_expr->ts = e->ts;
391 new_expr->where = e->where;
392 new_expr->rank = 1;
393 new_c = gfc_constructor_append_expr (&newbase, fcn, &(e->where));
394 new_c->iterator = c->iterator;
395 new_expr->value.constructor = newbase;
396 c->iterator = NULL;
398 fcn = new_expr;
401 if (fcn->rank != 0)
403 gfc_isym_id id = fn->value.function.isym->id;
405 if (id == GFC_ISYM_SUM || id == GFC_ISYM_PRODUCT)
406 fcn = gfc_build_intrinsic_call (current_ns, id,
407 fn->value.function.isym->name,
408 fn->where, 3, fcn, NULL, NULL);
409 else if (id == GFC_ISYM_ANY || id == GFC_ISYM_ALL)
410 fcn = gfc_build_intrinsic_call (current_ns, id,
411 fn->value.function.isym->name,
412 fn->where, 2, fcn, NULL);
413 else
414 gfc_internal_error ("Illegal id in copy_walk_reduction_arg");
416 fcn->symtree->n.sym->attr.access = ACCESS_PRIVATE;
419 return fcn;
422 /* Callback function for optimzation of reductions to scalars. Transform ANY
423 ([f1,f2,f3, ...]) to f1 .or. f2 .or. f3 .or. ..., with ANY, SUM and PRODUCT
424 correspondingly. Handly only the simple cases without MASK and DIM. */
426 static int
427 callback_reduction (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
428 void *data ATTRIBUTE_UNUSED)
430 gfc_expr *fn, *arg;
431 gfc_intrinsic_op op;
432 gfc_isym_id id;
433 gfc_actual_arglist *a;
434 gfc_actual_arglist *dim;
435 gfc_constructor *c;
436 gfc_expr *res, *new_expr;
437 gfc_actual_arglist *mask;
439 fn = *e;
441 if (fn->rank != 0 || fn->expr_type != EXPR_FUNCTION
442 || fn->value.function.isym == NULL)
443 return 0;
445 id = fn->value.function.isym->id;
447 if (id != GFC_ISYM_SUM && id != GFC_ISYM_PRODUCT
448 && id != GFC_ISYM_ANY && id != GFC_ISYM_ALL)
449 return 0;
451 a = fn->value.function.actual;
453 /* Don't handle MASK or DIM. */
455 dim = a->next;
457 if (dim->expr != NULL)
458 return 0;
460 if (id == GFC_ISYM_SUM || id == GFC_ISYM_PRODUCT)
462 mask = dim->next;
463 if ( mask->expr != NULL)
464 return 0;
467 arg = a->expr;
469 if (arg->expr_type != EXPR_ARRAY)
470 return 0;
472 switch (id)
474 case GFC_ISYM_SUM:
475 op = INTRINSIC_PLUS;
476 break;
478 case GFC_ISYM_PRODUCT:
479 op = INTRINSIC_TIMES;
480 break;
482 case GFC_ISYM_ANY:
483 op = INTRINSIC_OR;
484 break;
486 case GFC_ISYM_ALL:
487 op = INTRINSIC_AND;
488 break;
490 default:
491 return 0;
494 c = gfc_constructor_first (arg->value.constructor);
496 /* Don't do any simplififcation if we have
497 - no element in the constructor or
498 - only have a single element in the array which contains an
499 iterator. */
501 if (c == NULL)
502 return 0;
504 res = copy_walk_reduction_arg (c, fn);
506 c = gfc_constructor_next (c);
507 while (c)
509 new_expr = gfc_get_expr ();
510 new_expr->ts = fn->ts;
511 new_expr->expr_type = EXPR_OP;
512 new_expr->rank = fn->rank;
513 new_expr->where = fn->where;
514 new_expr->value.op.op = op;
515 new_expr->value.op.op1 = res;
516 new_expr->value.op.op2 = copy_walk_reduction_arg (c, fn);
517 res = new_expr;
518 c = gfc_constructor_next (c);
521 gfc_simplify_expr (res, 0);
522 *e = res;
523 gfc_free_expr (fn);
525 return 0;
528 /* Callback function for common function elimination, called from cfe_expr_0.
529 Put all eligible function expressions into expr_array. */
531 static int
532 cfe_register_funcs (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
533 void *data ATTRIBUTE_UNUSED)
536 if ((*e)->expr_type != EXPR_FUNCTION)
537 return 0;
539 /* We don't do character functions with unknown charlens. */
540 if ((*e)->ts.type == BT_CHARACTER
541 && ((*e)->ts.u.cl == NULL || (*e)->ts.u.cl->length == NULL
542 || (*e)->ts.u.cl->length->expr_type != EXPR_CONSTANT))
543 return 0;
545 /* We don't do function elimination within FORALL statements, it can
546 lead to wrong-code in certain circumstances. */
548 if (forall_level > 0)
549 return 0;
551 /* Function elimination inside an iterator could lead to functions which
552 depend on iterator variables being moved outside. FIXME: We should check
553 if the functions do indeed depend on the iterator variable. */
555 if (iterator_level > 0)
556 return 0;
558 /* If we don't know the shape at compile time, we create an allocatable
559 temporary variable to hold the intermediate result, but only if
560 allocation on assignment is active. */
562 if ((*e)->rank > 0 && (*e)->shape == NULL && !flag_realloc_lhs)
563 return 0;
565 /* Skip the test for pure functions if -faggressive-function-elimination
566 is specified. */
567 if ((*e)->value.function.esym)
569 /* Don't create an array temporary for elemental functions. */
570 if ((*e)->value.function.esym->attr.elemental && (*e)->rank > 0)
571 return 0;
573 /* Only eliminate potentially impure functions if the
574 user specifically requested it. */
575 if (!flag_aggressive_function_elimination
576 && !(*e)->value.function.esym->attr.pure
577 && !(*e)->value.function.esym->attr.implicit_pure)
578 return 0;
581 if ((*e)->value.function.isym)
583 /* Conversions are handled on the fly by the middle end,
584 transpose during trans-* stages and TRANSFER by the middle end. */
585 if ((*e)->value.function.isym->id == GFC_ISYM_CONVERSION
586 || (*e)->value.function.isym->id == GFC_ISYM_TRANSFER
587 || gfc_inline_intrinsic_function_p (*e))
588 return 0;
590 /* Don't create an array temporary for elemental functions,
591 as this would be wasteful of memory.
592 FIXME: Create a scalar temporary during scalarization. */
593 if ((*e)->value.function.isym->elemental && (*e)->rank > 0)
594 return 0;
596 if (!(*e)->value.function.isym->pure)
597 return 0;
600 expr_array.safe_push (e);
601 return 0;
604 /* Auxiliary function to check if an expression is a temporary created by
605 create var. */
607 static bool
608 is_fe_temp (gfc_expr *e)
610 if (e->expr_type != EXPR_VARIABLE)
611 return false;
613 return e->symtree->n.sym->attr.fe_temp;
616 /* Determine the length of a string, if it can be evaluated as a constant
617 expression. Return a newly allocated gfc_expr or NULL on failure.
618 If the user specified a substring which is potentially longer than
619 the string itself, the string will be padded with spaces, which
620 is harmless. */
622 static gfc_expr *
623 constant_string_length (gfc_expr *e)
626 gfc_expr *length;
627 gfc_ref *ref;
628 gfc_expr *res;
629 mpz_t value;
631 if (e->ts.u.cl)
633 length = e->ts.u.cl->length;
634 if (length && length->expr_type == EXPR_CONSTANT)
635 return gfc_copy_expr(length);
638 /* Return length of substring, if constant. */
639 for (ref = e->ref; ref; ref = ref->next)
641 if (ref->type == REF_SUBSTRING
642 && gfc_dep_difference (ref->u.ss.end, ref->u.ss.start, &value))
644 res = gfc_get_constant_expr (BT_INTEGER, gfc_charlen_int_kind,
645 &e->where);
647 mpz_add_ui (res->value.integer, value, 1);
648 mpz_clear (value);
649 return res;
653 /* Return length of char symbol, if constant. */
655 if (e->symtree && e->symtree->n.sym->ts.u.cl
656 && e->symtree->n.sym->ts.u.cl->length
657 && e->symtree->n.sym->ts.u.cl->length->expr_type == EXPR_CONSTANT)
658 return gfc_copy_expr (e->symtree->n.sym->ts.u.cl->length);
660 return NULL;
664 /* Insert a block at the current position unless it has already
665 been inserted; in this case use the one already there. */
667 static gfc_namespace*
668 insert_block ()
670 gfc_namespace *ns;
672 /* If the block hasn't already been created, do so. */
673 if (inserted_block == NULL)
675 inserted_block = XCNEW (gfc_code);
676 inserted_block->op = EXEC_BLOCK;
677 inserted_block->loc = (*current_code)->loc;
678 ns = gfc_build_block_ns (current_ns);
679 inserted_block->ext.block.ns = ns;
680 inserted_block->ext.block.assoc = NULL;
682 ns->code = *current_code;
684 /* If the statement has a label, make sure it is transferred to
685 the newly created block. */
687 if ((*current_code)->here)
689 inserted_block->here = (*current_code)->here;
690 (*current_code)->here = NULL;
693 inserted_block->next = (*current_code)->next;
694 changed_statement = &(inserted_block->ext.block.ns->code);
695 (*current_code)->next = NULL;
696 /* Insert the BLOCK at the right position. */
697 *current_code = inserted_block;
698 ns->parent = current_ns;
700 else
701 ns = inserted_block->ext.block.ns;
703 return ns;
706 /* Returns a new expression (a variable) to be used in place of the old one,
707 with an optional assignment statement before the current statement to set
708 the value of the variable. Creates a new BLOCK for the statement if that
709 hasn't already been done and puts the statement, plus the newly created
710 variables, in that block. Special cases: If the expression is constant or
711 a temporary which has already been created, just copy it. */
713 static gfc_expr*
714 create_var (gfc_expr * e, const char *vname)
716 char name[GFC_MAX_SYMBOL_LEN +1];
717 gfc_symtree *symtree;
718 gfc_symbol *symbol;
719 gfc_expr *result;
720 gfc_code *n;
721 gfc_namespace *ns;
722 int i;
723 bool deferred;
725 if (e->expr_type == EXPR_CONSTANT || is_fe_temp (e))
726 return gfc_copy_expr (e);
728 /* Creation of an array of unknown size requires realloc on assignment.
729 If that is not possible, just return NULL. */
730 if (flag_realloc_lhs == 0 && e->rank > 0 && e->shape == NULL)
731 return NULL;
733 ns = insert_block ();
735 if (vname)
736 snprintf (name, GFC_MAX_SYMBOL_LEN, "__var_%d_%s", var_num++, vname);
737 else
738 snprintf (name, GFC_MAX_SYMBOL_LEN, "__var_%d", var_num++);
740 if (gfc_get_sym_tree (name, ns, &symtree, false) != 0)
741 gcc_unreachable ();
743 symbol = symtree->n.sym;
744 symbol->ts = e->ts;
746 if (e->rank > 0)
748 symbol->as = gfc_get_array_spec ();
749 symbol->as->rank = e->rank;
751 if (e->shape == NULL)
753 /* We don't know the shape at compile time, so we use an
754 allocatable. */
755 symbol->as->type = AS_DEFERRED;
756 symbol->attr.allocatable = 1;
758 else
760 symbol->as->type = AS_EXPLICIT;
761 /* Copy the shape. */
762 for (i=0; i<e->rank; i++)
764 gfc_expr *p, *q;
766 p = gfc_get_constant_expr (BT_INTEGER, gfc_default_integer_kind,
767 &(e->where));
768 mpz_set_si (p->value.integer, 1);
769 symbol->as->lower[i] = p;
771 q = gfc_get_constant_expr (BT_INTEGER, gfc_index_integer_kind,
772 &(e->where));
773 mpz_set (q->value.integer, e->shape[i]);
774 symbol->as->upper[i] = q;
779 deferred = 0;
780 if (e->ts.type == BT_CHARACTER)
782 gfc_expr *length;
784 symbol->ts.u.cl = gfc_new_charlen (ns, NULL);
785 length = constant_string_length (e);
786 if (length)
787 symbol->ts.u.cl->length = length;
788 else
790 symbol->attr.allocatable = 1;
791 symbol->ts.u.cl->length = NULL;
792 symbol->ts.deferred = 1;
793 deferred = 1;
797 symbol->attr.flavor = FL_VARIABLE;
798 symbol->attr.referenced = 1;
799 symbol->attr.dimension = e->rank > 0;
800 symbol->attr.fe_temp = 1;
801 gfc_commit_symbol (symbol);
803 result = gfc_get_expr ();
804 result->expr_type = EXPR_VARIABLE;
805 result->ts = symbol->ts;
806 result->ts.deferred = deferred;
807 result->rank = e->rank;
808 result->shape = gfc_copy_shape (e->shape, e->rank);
809 result->symtree = symtree;
810 result->where = e->where;
811 if (e->rank > 0)
813 result->ref = gfc_get_ref ();
814 result->ref->type = REF_ARRAY;
815 result->ref->u.ar.type = AR_FULL;
816 result->ref->u.ar.where = e->where;
817 result->ref->u.ar.dimen = e->rank;
818 result->ref->u.ar.as = symbol->ts.type == BT_CLASS
819 ? CLASS_DATA (symbol)->as : symbol->as;
820 if (warn_array_temporaries)
821 gfc_warning (OPT_Warray_temporaries,
822 "Creating array temporary at %L", &(e->where));
825 /* Generate the new assignment. */
826 n = XCNEW (gfc_code);
827 n->op = EXEC_ASSIGN;
828 n->loc = (*current_code)->loc;
829 n->next = *changed_statement;
830 n->expr1 = gfc_copy_expr (result);
831 n->expr2 = e;
832 *changed_statement = n;
833 n_vars ++;
835 return result;
838 /* Warn about function elimination. */
840 static void
841 do_warn_function_elimination (gfc_expr *e)
843 if (e->expr_type != EXPR_FUNCTION)
844 return;
845 if (e->value.function.esym)
846 gfc_warning (OPT_Wfunction_elimination,
847 "Removing call to function %qs at %L",
848 e->value.function.esym->name, &(e->where));
849 else if (e->value.function.isym)
850 gfc_warning (OPT_Wfunction_elimination,
851 "Removing call to function %qs at %L",
852 e->value.function.isym->name, &(e->where));
854 /* Callback function for the code walker for doing common function
855 elimination. This builds up the list of functions in the expression
856 and goes through them to detect duplicates, which it then replaces
857 by variables. */
859 static int
860 cfe_expr_0 (gfc_expr **e, int *walk_subtrees,
861 void *data ATTRIBUTE_UNUSED)
863 int i,j;
864 gfc_expr *newvar;
865 gfc_expr **ei, **ej;
867 /* Don't do this optimization within OMP workshare or ASSOC lists. */
869 if (in_omp_workshare || in_assoc_list)
871 *walk_subtrees = 0;
872 return 0;
875 expr_array.release ();
877 gfc_expr_walker (e, cfe_register_funcs, NULL);
879 /* Walk through all the functions. */
881 FOR_EACH_VEC_ELT_FROM (expr_array, i, ei, 1)
883 /* Skip if the function has been replaced by a variable already. */
884 if ((*ei)->expr_type == EXPR_VARIABLE)
885 continue;
887 newvar = NULL;
888 for (j=0; j<i; j++)
890 ej = expr_array[j];
891 if (gfc_dep_compare_functions (*ei, *ej, true) == 0)
893 if (newvar == NULL)
894 newvar = create_var (*ei, "fcn");
896 if (warn_function_elimination)
897 do_warn_function_elimination (*ej);
899 free (*ej);
900 *ej = gfc_copy_expr (newvar);
903 if (newvar)
904 *ei = newvar;
907 /* We did all the necessary walking in this function. */
908 *walk_subtrees = 0;
909 return 0;
912 /* Callback function for common function elimination, called from
913 gfc_code_walker. This keeps track of the current code, in order
914 to insert statements as needed. */
916 static int
917 cfe_code (gfc_code **c, int *walk_subtrees, void *data ATTRIBUTE_UNUSED)
919 current_code = c;
920 inserted_block = NULL;
921 changed_statement = NULL;
923 /* Do not do anything inside a WHERE statement; scalar assignments, BLOCKs
924 and allocation on assigment are prohibited inside WHERE, and finally
925 masking an expression would lead to wrong-code when replacing
927 WHERE (a>0)
928 b = sum(foo(a) + foo(a))
929 END WHERE
931 with
933 WHERE (a > 0)
934 tmp = foo(a)
935 b = sum(tmp + tmp)
936 END WHERE
939 if ((*c)->op == EXEC_WHERE)
941 *walk_subtrees = 0;
942 return 0;
946 return 0;
949 /* Dummy function for expression call back, for use when we
950 really don't want to do any walking. */
952 static int
953 dummy_expr_callback (gfc_expr **e ATTRIBUTE_UNUSED, int *walk_subtrees,
954 void *data ATTRIBUTE_UNUSED)
956 *walk_subtrees = 0;
957 return 0;
960 /* Dummy function for code callback, for use when we really
961 don't want to do anything. */
963 gfc_dummy_code_callback (gfc_code **e ATTRIBUTE_UNUSED,
964 int *walk_subtrees ATTRIBUTE_UNUSED,
965 void *data ATTRIBUTE_UNUSED)
967 return 0;
970 /* Code callback function for converting
971 do while(a)
972 end do
973 into the equivalent
975 if (.not. a) exit
976 end do
977 This is because common function elimination would otherwise place the
978 temporary variables outside the loop. */
980 static int
981 convert_do_while (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
982 void *data ATTRIBUTE_UNUSED)
984 gfc_code *co = *c;
985 gfc_code *c_if1, *c_if2, *c_exit;
986 gfc_code *loopblock;
987 gfc_expr *e_not, *e_cond;
989 if (co->op != EXEC_DO_WHILE)
990 return 0;
992 if (co->expr1 == NULL || co->expr1->expr_type == EXPR_CONSTANT)
993 return 0;
995 e_cond = co->expr1;
997 /* Generate the condition of the if statement, which is .not. the original
998 statement. */
999 e_not = gfc_get_expr ();
1000 e_not->ts = e_cond->ts;
1001 e_not->where = e_cond->where;
1002 e_not->expr_type = EXPR_OP;
1003 e_not->value.op.op = INTRINSIC_NOT;
1004 e_not->value.op.op1 = e_cond;
1006 /* Generate the EXIT statement. */
1007 c_exit = XCNEW (gfc_code);
1008 c_exit->op = EXEC_EXIT;
1009 c_exit->ext.which_construct = co;
1010 c_exit->loc = co->loc;
1012 /* Generate the IF statement. */
1013 c_if2 = XCNEW (gfc_code);
1014 c_if2->op = EXEC_IF;
1015 c_if2->expr1 = e_not;
1016 c_if2->next = c_exit;
1017 c_if2->loc = co->loc;
1019 /* ... plus the one to chain it to. */
1020 c_if1 = XCNEW (gfc_code);
1021 c_if1->op = EXEC_IF;
1022 c_if1->block = c_if2;
1023 c_if1->loc = co->loc;
1025 /* Make the DO WHILE loop into a DO block by replacing the condition
1026 with a true constant. */
1027 co->expr1 = gfc_get_logical_expr (gfc_default_integer_kind, &co->loc, true);
1029 /* Hang the generated if statement into the loop body. */
1031 loopblock = co->block->next;
1032 co->block->next = c_if1;
1033 c_if1->next = loopblock;
1035 return 0;
1038 /* Code callback function for converting
1039 if (a) then
1041 else if (b) then
1042 end if
1044 into
1045 if (a) then
1046 else
1047 if (b) then
1048 end if
1049 end if
1051 because otherwise common function elimination would place the BLOCKs
1052 into the wrong place. */
1054 static int
1055 convert_elseif (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
1056 void *data ATTRIBUTE_UNUSED)
1058 gfc_code *co = *c;
1059 gfc_code *c_if1, *c_if2, *else_stmt;
1061 if (co->op != EXEC_IF)
1062 return 0;
1064 /* This loop starts out with the first ELSE statement. */
1065 else_stmt = co->block->block;
1067 while (else_stmt != NULL)
1069 gfc_code *next_else;
1071 /* If there is no condition, we're done. */
1072 if (else_stmt->expr1 == NULL)
1073 break;
1075 next_else = else_stmt->block;
1077 /* Generate the new IF statement. */
1078 c_if2 = XCNEW (gfc_code);
1079 c_if2->op = EXEC_IF;
1080 c_if2->expr1 = else_stmt->expr1;
1081 c_if2->next = else_stmt->next;
1082 c_if2->loc = else_stmt->loc;
1083 c_if2->block = next_else;
1085 /* ... plus the one to chain it to. */
1086 c_if1 = XCNEW (gfc_code);
1087 c_if1->op = EXEC_IF;
1088 c_if1->block = c_if2;
1089 c_if1->loc = else_stmt->loc;
1091 /* Insert the new IF after the ELSE. */
1092 else_stmt->expr1 = NULL;
1093 else_stmt->next = c_if1;
1094 else_stmt->block = NULL;
1096 else_stmt = next_else;
1098 /* Don't walk subtrees. */
1099 return 0;
1102 struct do_stack
1104 struct do_stack *prev;
1105 gfc_iterator *iter;
1106 gfc_code *code;
1107 } *stack_top;
1109 /* Recursively traverse the block of a WRITE or READ statement, and maybe
1110 optimize by replacing do loops with their analog array slices. For
1111 example:
1113 write (*,*) (a(i), i=1,4)
1115 is replaced with
1117 write (*,*) a(1:4:1) . */
1119 static bool
1120 traverse_io_block (gfc_code *code, bool *has_reached, gfc_code *prev)
1122 gfc_code *curr;
1123 gfc_expr *new_e, *expr, *start;
1124 gfc_ref *ref;
1125 struct do_stack ds_push;
1126 int i, future_rank = 0;
1127 gfc_iterator *iters[GFC_MAX_DIMENSIONS];
1128 gfc_expr *e;
1130 /* Find the first transfer/do statement. */
1131 for (curr = code; curr; curr = curr->next)
1133 if (curr->op == EXEC_DO || curr->op == EXEC_TRANSFER)
1134 break;
1137 /* Ensure it is the only transfer/do statement because cases like
1139 write (*,*) (a(i), b(i), i=1,4)
1141 cannot be optimized. */
1143 if (!curr || curr->next)
1144 return false;
1146 if (curr->op == EXEC_DO)
1148 if (curr->ext.iterator->var->ref)
1149 return false;
1150 ds_push.prev = stack_top;
1151 ds_push.iter = curr->ext.iterator;
1152 ds_push.code = curr;
1153 stack_top = &ds_push;
1154 if (traverse_io_block (curr->block->next, has_reached, prev))
1156 if (curr != stack_top->code && !*has_reached)
1158 curr->block->next = NULL;
1159 gfc_free_statements (curr);
1161 else
1162 *has_reached = true;
1163 return true;
1165 return false;
1168 gcc_assert (curr->op == EXEC_TRANSFER);
1170 e = curr->expr1;
1171 ref = e->ref;
1172 if (!ref || ref->type != REF_ARRAY || ref->u.ar.codimen != 0 || ref->next)
1173 return false;
1175 /* Find the iterators belonging to each variable and check conditions. */
1176 for (i = 0; i < ref->u.ar.dimen; i++)
1178 if (!ref->u.ar.start[i] || ref->u.ar.start[i]->ref
1179 || ref->u.ar.dimen_type[i] != DIMEN_ELEMENT)
1180 return false;
1182 start = ref->u.ar.start[i];
1183 gfc_simplify_expr (start, 0);
1184 switch (start->expr_type)
1186 case EXPR_VARIABLE:
1188 /* write (*,*) (a(i), i=a%b,1) not handled yet. */
1189 if (start->ref)
1190 return false;
1192 /* Check for (a(k), i=1,4) or ((a(j, i), i=1,4), j=1,4). */
1193 if (!stack_top || !stack_top->iter
1194 || stack_top->iter->var->symtree != start->symtree)
1196 /* Check for (a(i,i), i=1,3). */
1197 int j;
1199 for (j=0; j<i; j++)
1200 if (iters[j] && iters[j]->var->symtree == start->symtree)
1201 return false;
1203 iters[i] = NULL;
1205 else
1207 iters[i] = stack_top->iter;
1208 stack_top = stack_top->prev;
1209 future_rank++;
1211 break;
1212 case EXPR_CONSTANT:
1213 iters[i] = NULL;
1214 break;
1215 case EXPR_OP:
1216 switch (start->value.op.op)
1218 case INTRINSIC_PLUS:
1219 case INTRINSIC_TIMES:
1220 if (start->value.op.op1->expr_type != EXPR_VARIABLE)
1221 std::swap (start->value.op.op1, start->value.op.op2);
1222 gcc_fallthrough ();
1223 case INTRINSIC_MINUS:
1224 if ((start->value.op.op1->expr_type!= EXPR_VARIABLE
1225 && start->value.op.op2->expr_type != EXPR_CONSTANT)
1226 || start->value.op.op1->ref)
1227 return false;
1228 if (!stack_top || !stack_top->iter
1229 || stack_top->iter->var->symtree
1230 != start->value.op.op1->symtree)
1231 return false;
1232 iters[i] = stack_top->iter;
1233 stack_top = stack_top->prev;
1234 break;
1235 default:
1236 return false;
1238 future_rank++;
1239 break;
1240 default:
1241 return false;
1245 /* Check for cases like ((a(i, j), i=1, j), j=1, 2). */
1246 for (int i = 1; i < ref->u.ar.dimen; i++)
1248 if (iters[i])
1250 gfc_expr *var = iters[i]->var;
1251 for (int j = i - 1; j < i; j++)
1253 if (iters[j]
1254 && (gfc_check_dependency (var, iters[j]->start, true)
1255 || gfc_check_dependency (var, iters[j]->end, true)
1256 || gfc_check_dependency (var, iters[j]->step, true)))
1257 return false;
1262 /* Create new expr. */
1263 new_e = gfc_copy_expr (curr->expr1);
1264 new_e->expr_type = EXPR_VARIABLE;
1265 new_e->rank = future_rank;
1266 if (curr->expr1->shape)
1267 new_e->shape = gfc_get_shape (new_e->rank);
1269 /* Assign new starts, ends and strides if necessary. */
1270 for (i = 0; i < ref->u.ar.dimen; i++)
1272 if (!iters[i])
1273 continue;
1274 start = ref->u.ar.start[i];
1275 switch (start->expr_type)
1277 case EXPR_CONSTANT:
1278 gfc_internal_error ("bad expression");
1279 break;
1280 case EXPR_VARIABLE:
1281 new_e->ref->u.ar.dimen_type[i] = DIMEN_RANGE;
1282 new_e->ref->u.ar.type = AR_SECTION;
1283 gfc_free_expr (new_e->ref->u.ar.start[i]);
1284 new_e->ref->u.ar.start[i] = gfc_copy_expr (iters[i]->start);
1285 new_e->ref->u.ar.end[i] = gfc_copy_expr (iters[i]->end);
1286 new_e->ref->u.ar.stride[i] = gfc_copy_expr (iters[i]->step);
1287 break;
1288 case EXPR_OP:
1289 new_e->ref->u.ar.dimen_type[i] = DIMEN_RANGE;
1290 new_e->ref->u.ar.type = AR_SECTION;
1291 gfc_free_expr (new_e->ref->u.ar.start[i]);
1292 expr = gfc_copy_expr (start);
1293 expr->value.op.op1 = gfc_copy_expr (iters[i]->start);
1294 new_e->ref->u.ar.start[i] = expr;
1295 gfc_simplify_expr (new_e->ref->u.ar.start[i], 0);
1296 expr = gfc_copy_expr (start);
1297 expr->value.op.op1 = gfc_copy_expr (iters[i]->end);
1298 new_e->ref->u.ar.end[i] = expr;
1299 gfc_simplify_expr (new_e->ref->u.ar.end[i], 0);
1300 switch (start->value.op.op)
1302 case INTRINSIC_MINUS:
1303 case INTRINSIC_PLUS:
1304 new_e->ref->u.ar.stride[i] = gfc_copy_expr (iters[i]->step);
1305 break;
1306 case INTRINSIC_TIMES:
1307 expr = gfc_copy_expr (start);
1308 expr->value.op.op1 = gfc_copy_expr (iters[i]->step);
1309 new_e->ref->u.ar.stride[i] = expr;
1310 gfc_simplify_expr (new_e->ref->u.ar.stride[i], 0);
1311 break;
1312 default:
1313 gfc_internal_error ("bad op");
1315 break;
1316 default:
1317 gfc_internal_error ("bad expression");
1320 curr->expr1 = new_e;
1322 /* Insert modified statement. Check whether the statement needs to be
1323 inserted at the lowest level. */
1324 if (!stack_top->iter)
1326 if (prev)
1328 curr->next = prev->next->next;
1329 prev->next = curr;
1331 else
1333 curr->next = stack_top->code->block->next->next->next;
1334 stack_top->code->block->next = curr;
1337 else
1338 stack_top->code->block->next = curr;
1339 return true;
1342 /* Function for the gfc_code_walker. If code is a READ or WRITE statement, it
1343 tries to optimize its block. */
1345 static int
1346 simplify_io_impl_do (gfc_code **code, int *walk_subtrees,
1347 void *data ATTRIBUTE_UNUSED)
1349 gfc_code **curr, *prev = NULL;
1350 struct do_stack write, first;
1351 bool b = false;
1352 *walk_subtrees = 1;
1353 if (!(*code)->block
1354 || ((*code)->block->op != EXEC_WRITE
1355 && (*code)->block->op != EXEC_READ))
1356 return 0;
1358 *walk_subtrees = 0;
1359 write.prev = NULL;
1360 write.iter = NULL;
1361 write.code = *code;
1363 for (curr = &(*code)->block; *curr; curr = &(*curr)->next)
1365 if ((*curr)->op == EXEC_DO)
1367 first.prev = &write;
1368 first.iter = (*curr)->ext.iterator;
1369 first.code = *curr;
1370 stack_top = &first;
1371 traverse_io_block ((*curr)->block->next, &b, prev);
1372 stack_top = NULL;
1374 prev = *curr;
1376 return 0;
1379 /* Optimize a namespace, including all contained namespaces.
1380 flag_frontend_optimize and flag_fronend_loop_interchange are
1381 handled separately. */
1383 static void
1384 optimize_namespace (gfc_namespace *ns)
1386 gfc_namespace *saved_ns = gfc_current_ns;
1387 current_ns = ns;
1388 gfc_current_ns = ns;
1389 forall_level = 0;
1390 iterator_level = 0;
1391 in_assoc_list = false;
1392 in_omp_workshare = false;
1394 if (flag_frontend_optimize)
1396 gfc_code_walker (&ns->code, simplify_io_impl_do, dummy_expr_callback, NULL);
1397 gfc_code_walker (&ns->code, convert_do_while, dummy_expr_callback, NULL);
1398 gfc_code_walker (&ns->code, convert_elseif, dummy_expr_callback, NULL);
1399 gfc_code_walker (&ns->code, cfe_code, cfe_expr_0, NULL);
1400 gfc_code_walker (&ns->code, optimize_code, optimize_expr, NULL);
1401 if (flag_inline_matmul_limit != 0)
1403 bool found;
1406 found = false;
1407 gfc_code_walker (&ns->code, matmul_to_var_code, matmul_to_var_expr,
1408 (void *) &found);
1410 while (found);
1412 gfc_code_walker (&ns->code, matmul_temp_args, dummy_expr_callback,
1413 NULL);
1414 gfc_code_walker (&ns->code, inline_matmul_assign, dummy_expr_callback,
1415 NULL);
1419 if (flag_frontend_loop_interchange)
1420 gfc_code_walker (&ns->code, index_interchange, dummy_expr_callback,
1421 NULL);
1423 /* BLOCKs are handled in the expression walker below. */
1424 for (ns = ns->contained; ns; ns = ns->sibling)
1426 if (ns->code == NULL || ns->code->op != EXEC_BLOCK)
1427 optimize_namespace (ns);
1429 gfc_current_ns = saved_ns;
1432 /* Handle dependencies for allocatable strings which potentially redefine
1433 themselves in an assignment. */
1435 static void
1436 realloc_strings (gfc_namespace *ns)
1438 current_ns = ns;
1439 gfc_code_walker (&ns->code, realloc_string_callback, dummy_expr_callback, NULL);
1441 for (ns = ns->contained; ns; ns = ns->sibling)
1443 if (ns->code == NULL || ns->code->op != EXEC_BLOCK)
1444 realloc_strings (ns);
1449 static void
1450 optimize_reduction (gfc_namespace *ns)
1452 current_ns = ns;
1453 gfc_code_walker (&ns->code, gfc_dummy_code_callback,
1454 callback_reduction, NULL);
1456 /* BLOCKs are handled in the expression walker below. */
1457 for (ns = ns->contained; ns; ns = ns->sibling)
1459 if (ns->code == NULL || ns->code->op != EXEC_BLOCK)
1460 optimize_reduction (ns);
1464 /* Replace code like
1465 a = matmul(b,c) + d
1466 with
1467 a = matmul(b,c) ; a = a + d
1468 where the array function is not elemental and not allocatable
1469 and does not depend on the left-hand side.
1472 static bool
1473 optimize_binop_array_assignment (gfc_code *c, gfc_expr **rhs, bool seen_op)
1475 gfc_expr *e;
1477 if (!*rhs)
1478 return false;
1480 e = *rhs;
1481 if (e->expr_type == EXPR_OP)
1483 switch (e->value.op.op)
1485 /* Unary operators and exponentiation: Only look at a single
1486 operand. */
1487 case INTRINSIC_NOT:
1488 case INTRINSIC_UPLUS:
1489 case INTRINSIC_UMINUS:
1490 case INTRINSIC_PARENTHESES:
1491 case INTRINSIC_POWER:
1492 if (optimize_binop_array_assignment (c, &e->value.op.op1, seen_op))
1493 return true;
1494 break;
1496 case INTRINSIC_CONCAT:
1497 /* Do not do string concatenations. */
1498 break;
1500 default:
1501 /* Binary operators. */
1502 if (optimize_binop_array_assignment (c, &e->value.op.op1, true))
1503 return true;
1505 if (optimize_binop_array_assignment (c, &e->value.op.op2, true))
1506 return true;
1508 break;
1511 else if (seen_op && e->expr_type == EXPR_FUNCTION && e->rank > 0
1512 && ! (e->value.function.esym
1513 && (e->value.function.esym->attr.elemental
1514 || e->value.function.esym->attr.allocatable
1515 || e->value.function.esym->ts.type != c->expr1->ts.type
1516 || e->value.function.esym->ts.kind != c->expr1->ts.kind))
1517 && ! (e->value.function.isym
1518 && (e->value.function.isym->elemental
1519 || e->ts.type != c->expr1->ts.type
1520 || e->ts.kind != c->expr1->ts.kind))
1521 && ! gfc_inline_intrinsic_function_p (e))
1524 gfc_code *n;
1525 gfc_expr *new_expr;
1527 /* Insert a new assignment statement after the current one. */
1528 n = XCNEW (gfc_code);
1529 n->op = EXEC_ASSIGN;
1530 n->loc = c->loc;
1531 n->next = c->next;
1532 c->next = n;
1534 n->expr1 = gfc_copy_expr (c->expr1);
1535 n->expr2 = c->expr2;
1536 new_expr = gfc_copy_expr (c->expr1);
1537 c->expr2 = e;
1538 *rhs = new_expr;
1540 return true;
1544 /* Nothing to optimize. */
1545 return false;
1548 /* Remove unneeded TRIMs at the end of expressions. */
1550 static bool
1551 remove_trim (gfc_expr *rhs)
1553 bool ret;
1555 ret = false;
1556 if (!rhs)
1557 return ret;
1559 /* Check for a // b // trim(c). Looping is probably not
1560 necessary because the parser usually generates
1561 (// (// a b ) trim(c) ) , but better safe than sorry. */
1563 while (rhs->expr_type == EXPR_OP
1564 && rhs->value.op.op == INTRINSIC_CONCAT)
1565 rhs = rhs->value.op.op2;
1567 while (rhs->expr_type == EXPR_FUNCTION && rhs->value.function.isym
1568 && rhs->value.function.isym->id == GFC_ISYM_TRIM)
1570 strip_function_call (rhs);
1571 /* Recursive call to catch silly stuff like trim ( a // trim(b)). */
1572 remove_trim (rhs);
1573 ret = true;
1576 return ret;
1579 /* Optimizations for an assignment. */
1581 static void
1582 optimize_assignment (gfc_code * c)
1584 gfc_expr *lhs, *rhs;
1586 lhs = c->expr1;
1587 rhs = c->expr2;
1589 if (lhs->ts.type == BT_CHARACTER && !lhs->ts.deferred)
1591 /* Optimize a = trim(b) to a = b. */
1592 remove_trim (rhs);
1594 /* Replace a = ' ' by a = '' to optimize away a memcpy. */
1595 if (is_empty_string (rhs))
1596 rhs->value.character.length = 0;
1599 if (lhs->rank > 0 && gfc_check_dependency (lhs, rhs, true) == 0)
1600 optimize_binop_array_assignment (c, &rhs, false);
1604 /* Remove an unneeded function call, modifying the expression.
1605 This replaces the function call with the value of its
1606 first argument. The rest of the argument list is freed. */
1608 static void
1609 strip_function_call (gfc_expr *e)
1611 gfc_expr *e1;
1612 gfc_actual_arglist *a;
1614 a = e->value.function.actual;
1616 /* We should have at least one argument. */
1617 gcc_assert (a->expr != NULL);
1619 e1 = a->expr;
1621 /* Free the remaining arglist, if any. */
1622 if (a->next)
1623 gfc_free_actual_arglist (a->next);
1625 /* Graft the argument expression onto the original function. */
1626 *e = *e1;
1627 free (e1);
1631 /* Optimization of lexical comparison functions. */
1633 static bool
1634 optimize_lexical_comparison (gfc_expr *e)
1636 if (e->expr_type != EXPR_FUNCTION || e->value.function.isym == NULL)
1637 return false;
1639 switch (e->value.function.isym->id)
1641 case GFC_ISYM_LLE:
1642 return optimize_comparison (e, INTRINSIC_LE);
1644 case GFC_ISYM_LGE:
1645 return optimize_comparison (e, INTRINSIC_GE);
1647 case GFC_ISYM_LGT:
1648 return optimize_comparison (e, INTRINSIC_GT);
1650 case GFC_ISYM_LLT:
1651 return optimize_comparison (e, INTRINSIC_LT);
1653 default:
1654 break;
1656 return false;
1659 /* Combine stuff like [a]>b into [a>b], for easier optimization later. Do not
1660 do CHARACTER because of possible pessimization involving character
1661 lengths. */
1663 static bool
1664 combine_array_constructor (gfc_expr *e)
1667 gfc_expr *op1, *op2;
1668 gfc_expr *scalar;
1669 gfc_expr *new_expr;
1670 gfc_constructor *c, *new_c;
1671 gfc_constructor_base oldbase, newbase;
1672 bool scalar_first;
1673 int n_elem;
1674 bool all_const;
1676 /* Array constructors have rank one. */
1677 if (e->rank != 1)
1678 return false;
1680 /* Don't try to combine association lists, this makes no sense
1681 and leads to an ICE. */
1682 if (in_assoc_list)
1683 return false;
1685 /* With FORALL, the BLOCKS created by create_var will cause an ICE. */
1686 if (forall_level > 0)
1687 return false;
1689 /* Inside an iterator, things can get hairy; we are likely to create
1690 an invalid temporary variable. */
1691 if (iterator_level > 0)
1692 return false;
1694 op1 = e->value.op.op1;
1695 op2 = e->value.op.op2;
1697 if (!op1 || !op2)
1698 return false;
1700 if (op1->expr_type == EXPR_ARRAY && op2->rank == 0)
1701 scalar_first = false;
1702 else if (op2->expr_type == EXPR_ARRAY && op1->rank == 0)
1704 scalar_first = true;
1705 op1 = e->value.op.op2;
1706 op2 = e->value.op.op1;
1708 else
1709 return false;
1711 if (op2->ts.type == BT_CHARACTER)
1712 return false;
1714 /* This might be an expanded constructor with very many constant values. If
1715 we perform the operation here, we might end up with a long compile time
1716 and actually longer execution time, so a length bound is in order here.
1717 If the constructor constains something which is not a constant, it did
1718 not come from an expansion, so leave it alone. */
1720 #define CONSTR_LEN_MAX 4
1722 oldbase = op1->value.constructor;
1724 n_elem = 0;
1725 all_const = true;
1726 for (c = gfc_constructor_first (oldbase); c; c = gfc_constructor_next(c))
1728 if (c->expr->expr_type != EXPR_CONSTANT)
1730 all_const = false;
1731 break;
1733 n_elem += 1;
1736 if (all_const && n_elem > CONSTR_LEN_MAX)
1737 return false;
1739 #undef CONSTR_LEN_MAX
1741 newbase = NULL;
1742 e->expr_type = EXPR_ARRAY;
1744 scalar = create_var (gfc_copy_expr (op2), "constr");
1746 for (c = gfc_constructor_first (oldbase); c;
1747 c = gfc_constructor_next (c))
1749 new_expr = gfc_get_expr ();
1750 new_expr->ts = e->ts;
1751 new_expr->expr_type = EXPR_OP;
1752 new_expr->rank = c->expr->rank;
1753 new_expr->where = c->expr->where;
1754 new_expr->value.op.op = e->value.op.op;
1756 if (scalar_first)
1758 new_expr->value.op.op1 = gfc_copy_expr (scalar);
1759 new_expr->value.op.op2 = gfc_copy_expr (c->expr);
1761 else
1763 new_expr->value.op.op1 = gfc_copy_expr (c->expr);
1764 new_expr->value.op.op2 = gfc_copy_expr (scalar);
1767 new_c = gfc_constructor_append_expr (&newbase, new_expr, &(e->where));
1768 new_c->iterator = c->iterator;
1769 c->iterator = NULL;
1772 gfc_free_expr (op1);
1773 gfc_free_expr (op2);
1774 gfc_free_expr (scalar);
1776 e->value.constructor = newbase;
1777 return true;
1780 /* Change (-1)**k into 1-ishift(iand(k,1),1) and
1781 2**k into ishift(1,k) */
1783 static bool
1784 optimize_power (gfc_expr *e)
1786 gfc_expr *op1, *op2;
1787 gfc_expr *iand, *ishft;
1789 if (e->ts.type != BT_INTEGER)
1790 return false;
1792 op1 = e->value.op.op1;
1794 if (op1 == NULL || op1->expr_type != EXPR_CONSTANT)
1795 return false;
1797 if (mpz_cmp_si (op1->value.integer, -1L) == 0)
1799 gfc_free_expr (op1);
1801 op2 = e->value.op.op2;
1803 if (op2 == NULL)
1804 return false;
1806 iand = gfc_build_intrinsic_call (current_ns, GFC_ISYM_IAND,
1807 "_internal_iand", e->where, 2, op2,
1808 gfc_get_int_expr (e->ts.kind,
1809 &e->where, 1));
1811 ishft = gfc_build_intrinsic_call (current_ns, GFC_ISYM_ISHFT,
1812 "_internal_ishft", e->where, 2, iand,
1813 gfc_get_int_expr (e->ts.kind,
1814 &e->where, 1));
1816 e->value.op.op = INTRINSIC_MINUS;
1817 e->value.op.op1 = gfc_get_int_expr (e->ts.kind, &e->where, 1);
1818 e->value.op.op2 = ishft;
1819 return true;
1821 else if (mpz_cmp_si (op1->value.integer, 2L) == 0)
1823 gfc_free_expr (op1);
1825 op2 = e->value.op.op2;
1826 if (op2 == NULL)
1827 return false;
1829 ishft = gfc_build_intrinsic_call (current_ns, GFC_ISYM_ISHFT,
1830 "_internal_ishft", e->where, 2,
1831 gfc_get_int_expr (e->ts.kind,
1832 &e->where, 1),
1833 op2);
1834 *e = *ishft;
1835 return true;
1838 else if (mpz_cmp_si (op1->value.integer, 1L) == 0)
1840 op2 = e->value.op.op2;
1841 if (op2 == NULL)
1842 return false;
1844 gfc_free_expr (op1);
1845 gfc_free_expr (op2);
1847 e->expr_type = EXPR_CONSTANT;
1848 e->value.op.op1 = NULL;
1849 e->value.op.op2 = NULL;
1850 mpz_init_set_si (e->value.integer, 1);
1851 /* Typespec and location are still OK. */
1852 return true;
1855 return false;
1858 /* Recursive optimization of operators. */
1860 static bool
1861 optimize_op (gfc_expr *e)
1863 bool changed;
1865 gfc_intrinsic_op op = e->value.op.op;
1867 changed = false;
1869 /* Only use new-style comparisons. */
1870 switch(op)
1872 case INTRINSIC_EQ_OS:
1873 op = INTRINSIC_EQ;
1874 break;
1876 case INTRINSIC_GE_OS:
1877 op = INTRINSIC_GE;
1878 break;
1880 case INTRINSIC_LE_OS:
1881 op = INTRINSIC_LE;
1882 break;
1884 case INTRINSIC_NE_OS:
1885 op = INTRINSIC_NE;
1886 break;
1888 case INTRINSIC_GT_OS:
1889 op = INTRINSIC_GT;
1890 break;
1892 case INTRINSIC_LT_OS:
1893 op = INTRINSIC_LT;
1894 break;
1896 default:
1897 break;
1900 switch (op)
1902 case INTRINSIC_EQ:
1903 case INTRINSIC_GE:
1904 case INTRINSIC_LE:
1905 case INTRINSIC_NE:
1906 case INTRINSIC_GT:
1907 case INTRINSIC_LT:
1908 changed = optimize_comparison (e, op);
1910 gcc_fallthrough ();
1911 /* Look at array constructors. */
1912 case INTRINSIC_PLUS:
1913 case INTRINSIC_MINUS:
1914 case INTRINSIC_TIMES:
1915 case INTRINSIC_DIVIDE:
1916 return combine_array_constructor (e) || changed;
1918 case INTRINSIC_POWER:
1919 return optimize_power (e);
1921 default:
1922 break;
1925 return false;
1929 /* Return true if a constant string contains only blanks. */
1931 static bool
1932 is_empty_string (gfc_expr *e)
1934 int i;
1936 if (e->ts.type != BT_CHARACTER || e->expr_type != EXPR_CONSTANT)
1937 return false;
1939 for (i=0; i < e->value.character.length; i++)
1941 if (e->value.character.string[i] != ' ')
1942 return false;
1945 return true;
1949 /* Insert a call to the intrinsic len_trim. Use a different name for
1950 the symbol tree so we don't run into trouble when the user has
1951 renamed len_trim for some reason. */
1953 static gfc_expr*
1954 get_len_trim_call (gfc_expr *str, int kind)
1956 gfc_expr *fcn;
1957 gfc_actual_arglist *actual_arglist, *next;
1959 fcn = gfc_get_expr ();
1960 fcn->expr_type = EXPR_FUNCTION;
1961 fcn->value.function.isym = gfc_intrinsic_function_by_id (GFC_ISYM_LEN_TRIM);
1962 actual_arglist = gfc_get_actual_arglist ();
1963 actual_arglist->expr = str;
1964 next = gfc_get_actual_arglist ();
1965 next->expr = gfc_get_int_expr (gfc_default_integer_kind, NULL, kind);
1966 actual_arglist->next = next;
1968 fcn->value.function.actual = actual_arglist;
1969 fcn->where = str->where;
1970 fcn->ts.type = BT_INTEGER;
1971 fcn->ts.kind = gfc_charlen_int_kind;
1973 gfc_get_sym_tree ("__internal_len_trim", current_ns, &fcn->symtree, false);
1974 fcn->symtree->n.sym->ts = fcn->ts;
1975 fcn->symtree->n.sym->attr.flavor = FL_PROCEDURE;
1976 fcn->symtree->n.sym->attr.function = 1;
1977 fcn->symtree->n.sym->attr.elemental = 1;
1978 fcn->symtree->n.sym->attr.referenced = 1;
1979 fcn->symtree->n.sym->attr.access = ACCESS_PRIVATE;
1980 gfc_commit_symbol (fcn->symtree->n.sym);
1982 return fcn;
1985 /* Optimize expressions for equality. */
1987 static bool
1988 optimize_comparison (gfc_expr *e, gfc_intrinsic_op op)
1990 gfc_expr *op1, *op2;
1991 bool change;
1992 int eq;
1993 bool result;
1994 gfc_actual_arglist *firstarg, *secondarg;
1996 if (e->expr_type == EXPR_OP)
1998 firstarg = NULL;
1999 secondarg = NULL;
2000 op1 = e->value.op.op1;
2001 op2 = e->value.op.op2;
2003 else if (e->expr_type == EXPR_FUNCTION)
2005 /* One of the lexical comparison functions. */
2006 firstarg = e->value.function.actual;
2007 secondarg = firstarg->next;
2008 op1 = firstarg->expr;
2009 op2 = secondarg->expr;
2011 else
2012 gcc_unreachable ();
2014 /* Strip off unneeded TRIM calls from string comparisons. */
2016 change = remove_trim (op1);
2018 if (remove_trim (op2))
2019 change = true;
2021 /* An expression of type EXPR_CONSTANT is only valid for scalars. */
2022 /* TODO: A scalar constant may be acceptable in some cases (the scalarizer
2023 handles them well). However, there are also cases that need a non-scalar
2024 argument. For example the any intrinsic. See PR 45380. */
2025 if (e->rank > 0)
2026 return change;
2028 /* Replace a == '' with len_trim(a) == 0 and a /= '' with
2029 len_trim(a) != 0 */
2030 if (op1->ts.type == BT_CHARACTER && op2->ts.type == BT_CHARACTER
2031 && (op == INTRINSIC_EQ || op == INTRINSIC_NE))
2033 bool empty_op1, empty_op2;
2034 empty_op1 = is_empty_string (op1);
2035 empty_op2 = is_empty_string (op2);
2037 if (empty_op1 || empty_op2)
2039 gfc_expr *fcn;
2040 gfc_expr *zero;
2041 gfc_expr *str;
2043 /* This can only happen when an error for comparing
2044 characters of different kinds has already been issued. */
2045 if (empty_op1 && empty_op2)
2046 return false;
2048 zero = gfc_get_int_expr (gfc_charlen_int_kind, &e->where, 0);
2049 str = empty_op1 ? op2 : op1;
2051 fcn = get_len_trim_call (str, gfc_charlen_int_kind);
2054 if (empty_op1)
2055 gfc_free_expr (op1);
2056 else
2057 gfc_free_expr (op2);
2059 op1 = fcn;
2060 op2 = zero;
2061 e->value.op.op1 = fcn;
2062 e->value.op.op2 = zero;
2067 /* Don't compare REAL or COMPLEX expressions when honoring NaNs. */
2069 if (flag_finite_math_only
2070 || (op1->ts.type != BT_REAL && op2->ts.type != BT_REAL
2071 && op1->ts.type != BT_COMPLEX && op2->ts.type != BT_COMPLEX))
2073 eq = gfc_dep_compare_expr (op1, op2);
2074 if (eq <= -2)
2076 /* Replace A // B < A // C with B < C, and A // B < C // B
2077 with A < C. */
2078 if (op1->ts.type == BT_CHARACTER && op2->ts.type == BT_CHARACTER
2079 && op1->expr_type == EXPR_OP
2080 && op1->value.op.op == INTRINSIC_CONCAT
2081 && op2->expr_type == EXPR_OP
2082 && op2->value.op.op == INTRINSIC_CONCAT)
2084 gfc_expr *op1_left = op1->value.op.op1;
2085 gfc_expr *op2_left = op2->value.op.op1;
2086 gfc_expr *op1_right = op1->value.op.op2;
2087 gfc_expr *op2_right = op2->value.op.op2;
2089 if (gfc_dep_compare_expr (op1_left, op2_left) == 0)
2091 /* Watch out for 'A ' // x vs. 'A' // x. */
2093 if (op1_left->expr_type == EXPR_CONSTANT
2094 && op2_left->expr_type == EXPR_CONSTANT
2095 && op1_left->value.character.length
2096 != op2_left->value.character.length)
2097 return change;
2098 else
2100 free (op1_left);
2101 free (op2_left);
2102 if (firstarg)
2104 firstarg->expr = op1_right;
2105 secondarg->expr = op2_right;
2107 else
2109 e->value.op.op1 = op1_right;
2110 e->value.op.op2 = op2_right;
2112 optimize_comparison (e, op);
2113 return true;
2116 if (gfc_dep_compare_expr (op1_right, op2_right) == 0)
2118 free (op1_right);
2119 free (op2_right);
2120 if (firstarg)
2122 firstarg->expr = op1_left;
2123 secondarg->expr = op2_left;
2125 else
2127 e->value.op.op1 = op1_left;
2128 e->value.op.op2 = op2_left;
2131 optimize_comparison (e, op);
2132 return true;
2136 else
2138 /* eq can only be -1, 0 or 1 at this point. */
2139 switch (op)
2141 case INTRINSIC_EQ:
2142 result = eq == 0;
2143 break;
2145 case INTRINSIC_GE:
2146 result = eq >= 0;
2147 break;
2149 case INTRINSIC_LE:
2150 result = eq <= 0;
2151 break;
2153 case INTRINSIC_NE:
2154 result = eq != 0;
2155 break;
2157 case INTRINSIC_GT:
2158 result = eq > 0;
2159 break;
2161 case INTRINSIC_LT:
2162 result = eq < 0;
2163 break;
2165 default:
2166 gfc_internal_error ("illegal OP in optimize_comparison");
2167 break;
2170 /* Replace the expression by a constant expression. The typespec
2171 and where remains the way it is. */
2172 free (op1);
2173 free (op2);
2174 e->expr_type = EXPR_CONSTANT;
2175 e->value.logical = result;
2176 return true;
2180 return change;
2183 /* Optimize a trim function by replacing it with an equivalent substring
2184 involving a call to len_trim. This only works for expressions where
2185 variables are trimmed. Return true if anything was modified. */
2187 static bool
2188 optimize_trim (gfc_expr *e)
2190 gfc_expr *a;
2191 gfc_ref *ref;
2192 gfc_expr *fcn;
2193 gfc_ref **rr = NULL;
2195 /* Don't do this optimization within an argument list, because
2196 otherwise aliasing issues may occur. */
2198 if (count_arglist != 1)
2199 return false;
2201 if (e->ts.type != BT_CHARACTER || e->expr_type != EXPR_FUNCTION
2202 || e->value.function.isym == NULL
2203 || e->value.function.isym->id != GFC_ISYM_TRIM)
2204 return false;
2206 a = e->value.function.actual->expr;
2208 if (a->expr_type != EXPR_VARIABLE)
2209 return false;
2211 /* This would pessimize the idiom a = trim(a) for reallocatable strings. */
2213 if (a->symtree->n.sym->attr.allocatable)
2214 return false;
2216 /* Follow all references to find the correct place to put the newly
2217 created reference. FIXME: Also handle substring references and
2218 array references. Array references cause strange regressions at
2219 the moment. */
2221 if (a->ref)
2223 for (rr = &(a->ref); *rr; rr = &((*rr)->next))
2225 if ((*rr)->type == REF_SUBSTRING || (*rr)->type == REF_ARRAY)
2226 return false;
2230 strip_function_call (e);
2232 if (e->ref == NULL)
2233 rr = &(e->ref);
2235 /* Create the reference. */
2237 ref = gfc_get_ref ();
2238 ref->type = REF_SUBSTRING;
2240 /* Set the start of the reference. */
2242 ref->u.ss.start = gfc_get_int_expr (gfc_charlen_int_kind, NULL, 1);
2244 /* Build the function call to len_trim(x, gfc_default_integer_kind). */
2246 fcn = get_len_trim_call (gfc_copy_expr (e), gfc_charlen_int_kind);
2248 /* Set the end of the reference to the call to len_trim. */
2250 ref->u.ss.end = fcn;
2251 gcc_assert (rr != NULL && *rr == NULL);
2252 *rr = ref;
2253 return true;
2256 /* Optimize minloc(b), where b is rank 1 array, into
2257 (/ minloc(b, dim=1) /), and similarly for maxloc,
2258 as the latter forms are expanded inline. */
2260 static void
2261 optimize_minmaxloc (gfc_expr **e)
2263 gfc_expr *fn = *e;
2264 gfc_actual_arglist *a;
2265 char *name, *p;
2267 if (fn->rank != 1
2268 || fn->value.function.actual == NULL
2269 || fn->value.function.actual->expr == NULL
2270 || fn->value.function.actual->expr->rank != 1)
2271 return;
2273 *e = gfc_get_array_expr (fn->ts.type, fn->ts.kind, &fn->where);
2274 (*e)->shape = fn->shape;
2275 fn->rank = 0;
2276 fn->shape = NULL;
2277 gfc_constructor_append_expr (&(*e)->value.constructor, fn, &fn->where);
2279 name = XALLOCAVEC (char, strlen (fn->value.function.name) + 1);
2280 strcpy (name, fn->value.function.name);
2281 p = strstr (name, "loc0");
2282 p[3] = '1';
2283 fn->value.function.name = gfc_get_string ("%s", name);
2284 if (fn->value.function.actual->next)
2286 a = fn->value.function.actual->next;
2287 gcc_assert (a->expr == NULL);
2289 else
2291 a = gfc_get_actual_arglist ();
2292 fn->value.function.actual->next = a;
2294 a->expr = gfc_get_constant_expr (BT_INTEGER, gfc_default_integer_kind,
2295 &fn->where);
2296 mpz_set_ui (a->expr->value.integer, 1);
2299 /* Callback function for code checking that we do not pass a DO variable to an
2300 INTENT(OUT) or INTENT(INOUT) dummy variable. */
2302 static int
2303 doloop_code (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
2304 void *data ATTRIBUTE_UNUSED)
2306 gfc_code *co;
2307 int i;
2308 gfc_formal_arglist *f;
2309 gfc_actual_arglist *a;
2310 gfc_code *cl;
2311 do_t loop, *lp;
2312 bool seen_goto;
2314 co = *c;
2316 /* If the doloop_list grew, we have to truncate it here. */
2318 if ((unsigned) doloop_level < doloop_list.length())
2319 doloop_list.truncate (doloop_level);
2321 seen_goto = false;
2322 switch (co->op)
2324 case EXEC_DO:
2326 if (co->ext.iterator && co->ext.iterator->var)
2327 loop.c = co;
2328 else
2329 loop.c = NULL;
2331 loop.branch_level = if_level + select_level;
2332 loop.seen_goto = false;
2333 doloop_list.safe_push (loop);
2334 break;
2336 /* If anything could transfer control away from a suspicious
2337 subscript, make sure to set seen_goto in the current DO loop
2338 (if any). */
2339 case EXEC_GOTO:
2340 case EXEC_EXIT:
2341 case EXEC_STOP:
2342 case EXEC_ERROR_STOP:
2343 case EXEC_CYCLE:
2344 seen_goto = true;
2345 break;
2347 case EXEC_OPEN:
2348 if (co->ext.open->err)
2349 seen_goto = true;
2350 break;
2352 case EXEC_CLOSE:
2353 if (co->ext.close->err)
2354 seen_goto = true;
2355 break;
2357 case EXEC_BACKSPACE:
2358 case EXEC_ENDFILE:
2359 case EXEC_REWIND:
2360 case EXEC_FLUSH:
2362 if (co->ext.filepos->err)
2363 seen_goto = true;
2364 break;
2366 case EXEC_INQUIRE:
2367 if (co->ext.filepos->err)
2368 seen_goto = true;
2369 break;
2371 case EXEC_READ:
2372 case EXEC_WRITE:
2373 if (co->ext.dt->err || co->ext.dt->end || co->ext.dt->eor)
2374 seen_goto = true;
2375 break;
2377 case EXEC_WAIT:
2378 if (co->ext.wait->err || co->ext.wait->end || co->ext.wait->eor)
2379 loop.seen_goto = true;
2380 break;
2382 case EXEC_CALL:
2384 if (co->resolved_sym == NULL)
2385 break;
2387 f = gfc_sym_get_dummy_args (co->resolved_sym);
2389 /* Withot a formal arglist, there is only unknown INTENT,
2390 which we don't check for. */
2391 if (f == NULL)
2392 break;
2394 a = co->ext.actual;
2396 while (a && f)
2398 FOR_EACH_VEC_ELT (doloop_list, i, lp)
2400 gfc_symbol *do_sym;
2401 cl = lp->c;
2403 if (cl == NULL)
2404 break;
2406 do_sym = cl->ext.iterator->var->symtree->n.sym;
2408 if (a->expr && a->expr->symtree
2409 && a->expr->symtree->n.sym == do_sym)
2411 if (f->sym->attr.intent == INTENT_OUT)
2412 gfc_error_now ("Variable %qs at %L set to undefined "
2413 "value inside loop beginning at %L as "
2414 "INTENT(OUT) argument to subroutine %qs",
2415 do_sym->name, &a->expr->where,
2416 &(doloop_list[i].c->loc),
2417 co->symtree->n.sym->name);
2418 else if (f->sym->attr.intent == INTENT_INOUT)
2419 gfc_error_now ("Variable %qs at %L not definable inside "
2420 "loop beginning at %L as INTENT(INOUT) "
2421 "argument to subroutine %qs",
2422 do_sym->name, &a->expr->where,
2423 &(doloop_list[i].c->loc),
2424 co->symtree->n.sym->name);
2427 a = a->next;
2428 f = f->next;
2430 break;
2432 default:
2433 break;
2435 if (seen_goto && doloop_level > 0)
2436 doloop_list[doloop_level-1].seen_goto = true;
2438 return 0;
2441 /* Callback function to warn about different things within DO loops. */
2443 static int
2444 do_function (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
2445 void *data ATTRIBUTE_UNUSED)
2447 do_t *last;
2449 if (doloop_list.length () == 0)
2450 return 0;
2452 if ((*e)->expr_type == EXPR_FUNCTION)
2453 do_intent (e);
2455 last = &doloop_list.last();
2456 if (last->seen_goto && !warn_do_subscript)
2457 return 0;
2459 if ((*e)->expr_type == EXPR_VARIABLE)
2460 do_subscript (e);
2462 return 0;
2465 typedef struct
2467 gfc_symbol *sym;
2468 mpz_t val;
2469 } insert_index_t;
2471 /* Callback function - if the expression is the variable in data->sym,
2472 replace it with a constant from data->val. */
2474 static int
2475 callback_insert_index (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
2476 void *data)
2478 insert_index_t *d;
2479 gfc_expr *ex, *n;
2481 ex = (*e);
2482 if (ex->expr_type != EXPR_VARIABLE)
2483 return 0;
2485 d = (insert_index_t *) data;
2486 if (ex->symtree->n.sym != d->sym)
2487 return 0;
2489 n = gfc_get_constant_expr (BT_INTEGER, ex->ts.kind, &ex->where);
2490 mpz_set (n->value.integer, d->val);
2492 gfc_free_expr (ex);
2493 *e = n;
2494 return 0;
2497 /* In the expression e, replace occurrences of the variable sym with
2498 val. If this results in a constant expression, return true and
2499 return the value in ret. Return false if the expression already
2500 is a constant. Caller has to clear ret in that case. */
2502 static bool
2503 insert_index (gfc_expr *e, gfc_symbol *sym, mpz_t val, mpz_t ret)
2505 gfc_expr *n;
2506 insert_index_t data;
2507 bool rc;
2509 if (e->expr_type == EXPR_CONSTANT)
2510 return false;
2512 n = gfc_copy_expr (e);
2513 data.sym = sym;
2514 mpz_init_set (data.val, val);
2515 gfc_expr_walker (&n, callback_insert_index, (void *) &data);
2516 gfc_simplify_expr (n, 0);
2518 if (n->expr_type == EXPR_CONSTANT)
2520 rc = true;
2521 mpz_init_set (ret, n->value.integer);
2523 else
2524 rc = false;
2526 mpz_clear (data.val);
2527 gfc_free_expr (n);
2528 return rc;
2532 /* Check array subscripts for possible out-of-bounds accesses in DO
2533 loops with constant bounds. */
2535 static int
2536 do_subscript (gfc_expr **e)
2538 gfc_expr *v;
2539 gfc_array_ref *ar;
2540 gfc_ref *ref;
2541 int i,j;
2542 gfc_code *dl;
2543 do_t *lp;
2545 v = *e;
2546 /* Constants are already checked. */
2547 if (v->expr_type == EXPR_CONSTANT)
2548 return 0;
2550 /* Wrong warnings will be generated in an associate list. */
2551 if (in_assoc_list)
2552 return 0;
2554 for (ref = v->ref; ref; ref = ref->next)
2556 if (ref->type == REF_ARRAY && ref->u.ar.type == AR_ELEMENT)
2558 ar = & ref->u.ar;
2559 FOR_EACH_VEC_ELT (doloop_list, j, lp)
2561 gfc_symbol *do_sym;
2562 mpz_t do_start, do_step, do_end;
2563 bool have_do_start, have_do_end;
2564 bool error_not_proven;
2565 int warn;
2567 dl = lp->c;
2568 if (dl == NULL)
2569 break;
2571 /* If we are within a branch, or a goto or equivalent
2572 was seen in the DO loop before, then we cannot prove that
2573 this expression is actually evaluated. Don't do anything
2574 unless we want to see it all. */
2575 error_not_proven = lp->seen_goto
2576 || lp->branch_level < if_level + select_level;
2578 if (error_not_proven && !warn_do_subscript)
2579 break;
2581 if (error_not_proven)
2582 warn = OPT_Wdo_subscript;
2583 else
2584 warn = 0;
2586 do_sym = dl->ext.iterator->var->symtree->n.sym;
2587 if (do_sym->ts.type != BT_INTEGER)
2588 continue;
2590 /* If we do not know about the stepsize, the loop may be zero trip.
2591 Do not warn in this case. */
2593 if (dl->ext.iterator->step->expr_type == EXPR_CONSTANT)
2594 mpz_init_set (do_step, dl->ext.iterator->step->value.integer);
2595 else
2596 continue;
2598 if (dl->ext.iterator->start->expr_type == EXPR_CONSTANT)
2600 have_do_start = true;
2601 mpz_init_set (do_start, dl->ext.iterator->start->value.integer);
2603 else
2604 have_do_start = false;
2607 if (dl->ext.iterator->end->expr_type == EXPR_CONSTANT)
2609 have_do_end = true;
2610 mpz_init_set (do_end, dl->ext.iterator->end->value.integer);
2612 else
2613 have_do_end = false;
2615 if (!have_do_start && !have_do_end)
2616 return 0;
2618 /* May have to correct the end value if the step does not equal
2619 one. */
2620 if (have_do_start && have_do_end && mpz_cmp_ui (do_step, 1) != 0)
2622 mpz_t diff, rem;
2624 mpz_init (diff);
2625 mpz_init (rem);
2626 mpz_sub (diff, do_end, do_start);
2627 mpz_tdiv_r (rem, diff, do_step);
2628 mpz_sub (do_end, do_end, rem);
2629 mpz_clear (diff);
2630 mpz_clear (rem);
2633 for (i = 0; i< ar->dimen; i++)
2635 mpz_t val;
2636 if (ar->dimen_type[i] == DIMEN_ELEMENT && have_do_start
2637 && insert_index (ar->start[i], do_sym, do_start, val))
2639 if (ar->as->lower[i]
2640 && ar->as->lower[i]->expr_type == EXPR_CONSTANT
2641 && mpz_cmp (val, ar->as->lower[i]->value.integer) < 0)
2642 gfc_warning (warn, "Array reference at %L out of bounds "
2643 "(%ld < %ld) in loop beginning at %L",
2644 &ar->start[i]->where, mpz_get_si (val),
2645 mpz_get_si (ar->as->lower[i]->value.integer),
2646 &doloop_list[j].c->loc);
2648 if (ar->as->upper[i]
2649 && ar->as->upper[i]->expr_type == EXPR_CONSTANT
2650 && mpz_cmp (val, ar->as->upper[i]->value.integer) > 0)
2651 gfc_warning (warn, "Array reference at %L out of bounds "
2652 "(%ld > %ld) in loop beginning at %L",
2653 &ar->start[i]->where, mpz_get_si (val),
2654 mpz_get_si (ar->as->upper[i]->value.integer),
2655 &doloop_list[j].c->loc);
2657 mpz_clear (val);
2660 if (ar->dimen_type[i] == DIMEN_ELEMENT && have_do_end
2661 && insert_index (ar->start[i], do_sym, do_end, val))
2663 if (ar->as->lower[i]
2664 && ar->as->lower[i]->expr_type == EXPR_CONSTANT
2665 && mpz_cmp (val, ar->as->lower[i]->value.integer) < 0)
2666 gfc_warning (warn, "Array reference at %L out of bounds "
2667 "(%ld < %ld) in loop beginning at %L",
2668 &ar->start[i]->where, mpz_get_si (val),
2669 mpz_get_si (ar->as->lower[i]->value.integer),
2670 &doloop_list[j].c->loc);
2672 if (ar->as->upper[i]
2673 && ar->as->upper[i]->expr_type == EXPR_CONSTANT
2674 && mpz_cmp (val, ar->as->upper[i]->value.integer) > 0)
2675 gfc_warning (warn, "Array reference at %L out of bounds "
2676 "(%ld > %ld) in loop beginning at %L",
2677 &ar->start[i]->where, mpz_get_si (val),
2678 mpz_get_si (ar->as->upper[i]->value.integer),
2679 &doloop_list[j].c->loc);
2681 mpz_clear (val);
2687 return 0;
2689 /* Function for functions checking that we do not pass a DO variable
2690 to an INTENT(OUT) or INTENT(INOUT) dummy variable. */
2692 static int
2693 do_intent (gfc_expr **e)
2695 gfc_formal_arglist *f;
2696 gfc_actual_arglist *a;
2697 gfc_expr *expr;
2698 gfc_code *dl;
2699 do_t *lp;
2700 int i;
2702 expr = *e;
2703 if (expr->expr_type != EXPR_FUNCTION)
2704 return 0;
2706 /* Intrinsic functions don't modify their arguments. */
2708 if (expr->value.function.isym)
2709 return 0;
2711 f = gfc_sym_get_dummy_args (expr->symtree->n.sym);
2713 /* Without a formal arglist, there is only unknown INTENT,
2714 which we don't check for. */
2715 if (f == NULL)
2716 return 0;
2718 a = expr->value.function.actual;
2720 while (a && f)
2722 FOR_EACH_VEC_ELT (doloop_list, i, lp)
2724 gfc_symbol *do_sym;
2725 dl = lp->c;
2726 if (dl == NULL)
2727 break;
2729 do_sym = dl->ext.iterator->var->symtree->n.sym;
2731 if (a->expr && a->expr->symtree
2732 && a->expr->symtree->n.sym == do_sym)
2734 if (f->sym->attr.intent == INTENT_OUT)
2735 gfc_error_now ("Variable %qs at %L set to undefined value "
2736 "inside loop beginning at %L as INTENT(OUT) "
2737 "argument to function %qs", do_sym->name,
2738 &a->expr->where, &doloop_list[i].c->loc,
2739 expr->symtree->n.sym->name);
2740 else if (f->sym->attr.intent == INTENT_INOUT)
2741 gfc_error_now ("Variable %qs at %L not definable inside loop"
2742 " beginning at %L as INTENT(INOUT) argument to"
2743 " function %qs", do_sym->name,
2744 &a->expr->where, &doloop_list[i].c->loc,
2745 expr->symtree->n.sym->name);
2748 a = a->next;
2749 f = f->next;
2752 return 0;
2755 static void
2756 doloop_warn (gfc_namespace *ns)
2758 gfc_code_walker (&ns->code, doloop_code, do_function, NULL);
2761 /* This selction deals with inlining calls to MATMUL. */
2763 /* Replace calls to matmul outside of straight assignments with a temporary
2764 variable so that later inlining will work. */
2766 static int
2767 matmul_to_var_expr (gfc_expr **ep, int *walk_subtrees ATTRIBUTE_UNUSED,
2768 void *data)
2770 gfc_expr *e, *n;
2771 bool *found = (bool *) data;
2773 e = *ep;
2775 if (e->expr_type != EXPR_FUNCTION
2776 || e->value.function.isym == NULL
2777 || e->value.function.isym->id != GFC_ISYM_MATMUL)
2778 return 0;
2780 if (forall_level > 0 || iterator_level > 0 || in_omp_workshare
2781 || in_where || in_assoc_list)
2782 return 0;
2784 /* Check if this is already in the form c = matmul(a,b). */
2786 if ((*current_code)->expr2 == e)
2787 return 0;
2789 n = create_var (e, "matmul");
2791 /* If create_var is unable to create a variable (for example if
2792 -fno-realloc-lhs is in force with a variable that does not have bounds
2793 known at compile-time), just return. */
2795 if (n == NULL)
2796 return 0;
2798 *ep = n;
2799 *found = true;
2800 return 0;
2803 /* Set current_code and associated variables so that matmul_to_var_expr can
2804 work. */
2806 static int
2807 matmul_to_var_code (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
2808 void *data ATTRIBUTE_UNUSED)
2810 if (current_code != c)
2812 current_code = c;
2813 inserted_block = NULL;
2814 changed_statement = NULL;
2817 return 0;
2821 /* Take a statement of the shape c = matmul(a,b) and create temporaries
2822 for a and b if there is a dependency between the arguments and the
2823 result variable or if a or b are the result of calculations that cannot
2824 be handled by the inliner. */
2826 static int
2827 matmul_temp_args (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
2828 void *data ATTRIBUTE_UNUSED)
2830 gfc_expr *expr1, *expr2;
2831 gfc_code *co;
2832 gfc_actual_arglist *a, *b;
2833 bool a_tmp, b_tmp;
2834 gfc_expr *matrix_a, *matrix_b;
2835 bool conjg_a, conjg_b, transpose_a, transpose_b;
2837 co = *c;
2839 if (co->op != EXEC_ASSIGN)
2840 return 0;
2842 if (forall_level > 0 || iterator_level > 0 || in_omp_workshare
2843 || in_where)
2844 return 0;
2846 /* This has some duplication with inline_matmul_assign. This
2847 is because the creation of temporary variables could still fail,
2848 and inline_matmul_assign still needs to be able to handle these
2849 cases. */
2850 expr1 = co->expr1;
2851 expr2 = co->expr2;
2853 if (expr2->expr_type != EXPR_FUNCTION
2854 || expr2->value.function.isym == NULL
2855 || expr2->value.function.isym->id != GFC_ISYM_MATMUL)
2856 return 0;
2858 a_tmp = false;
2859 a = expr2->value.function.actual;
2860 matrix_a = check_conjg_transpose_variable (a->expr, &conjg_a, &transpose_a);
2861 if (matrix_a != NULL)
2863 if (matrix_a->expr_type == EXPR_VARIABLE
2864 && (gfc_check_dependency (matrix_a, expr1, true)
2865 || has_dimen_vector_ref (matrix_a)))
2866 a_tmp = true;
2868 else
2869 a_tmp = true;
2871 b_tmp = false;
2872 b = a->next;
2873 matrix_b = check_conjg_transpose_variable (b->expr, &conjg_b, &transpose_b);
2874 if (matrix_b != NULL)
2876 if (matrix_b->expr_type == EXPR_VARIABLE
2877 && (gfc_check_dependency (matrix_b, expr1, true)
2878 || has_dimen_vector_ref (matrix_b)))
2879 b_tmp = true;
2881 else
2882 b_tmp = true;
2884 if (!a_tmp && !b_tmp)
2885 return 0;
2887 current_code = c;
2888 inserted_block = NULL;
2889 changed_statement = NULL;
2890 if (a_tmp)
2892 gfc_expr *at;
2893 at = create_var (a->expr,"mma");
2894 if (at)
2895 a->expr = at;
2897 if (b_tmp)
2899 gfc_expr *bt;
2900 bt = create_var (b->expr,"mmb");
2901 if (bt)
2902 b->expr = bt;
2904 return 0;
2907 /* Auxiliary function to build and simplify an array inquiry function.
2908 dim is zero-based. */
2910 static gfc_expr *
2911 get_array_inq_function (gfc_isym_id id, gfc_expr *e, int dim)
2913 gfc_expr *fcn;
2914 gfc_expr *dim_arg, *kind;
2915 const char *name;
2916 gfc_expr *ec;
2918 switch (id)
2920 case GFC_ISYM_LBOUND:
2921 name = "_gfortran_lbound";
2922 break;
2924 case GFC_ISYM_UBOUND:
2925 name = "_gfortran_ubound";
2926 break;
2928 case GFC_ISYM_SIZE:
2929 name = "_gfortran_size";
2930 break;
2932 default:
2933 gcc_unreachable ();
2936 dim_arg = gfc_get_int_expr (gfc_default_integer_kind, &e->where, dim);
2937 kind = gfc_get_int_expr (gfc_default_integer_kind, &e->where,
2938 gfc_index_integer_kind);
2940 ec = gfc_copy_expr (e);
2941 fcn = gfc_build_intrinsic_call (current_ns, id, name, e->where, 3,
2942 ec, dim_arg, kind);
2943 gfc_simplify_expr (fcn, 0);
2944 return fcn;
2947 /* Builds a logical expression. */
2949 static gfc_expr*
2950 build_logical_expr (gfc_intrinsic_op op, gfc_expr *e1, gfc_expr *e2)
2952 gfc_typespec ts;
2953 gfc_expr *res;
2955 ts.type = BT_LOGICAL;
2956 ts.kind = gfc_default_logical_kind;
2957 res = gfc_get_expr ();
2958 res->where = e1->where;
2959 res->expr_type = EXPR_OP;
2960 res->value.op.op = op;
2961 res->value.op.op1 = e1;
2962 res->value.op.op2 = e2;
2963 res->ts = ts;
2965 return res;
2969 /* Return an operation of one two gfc_expr (one if e2 is NULL). This assumes
2970 compatible typespecs. */
2972 static gfc_expr *
2973 get_operand (gfc_intrinsic_op op, gfc_expr *e1, gfc_expr *e2)
2975 gfc_expr *res;
2977 res = gfc_get_expr ();
2978 res->ts = e1->ts;
2979 res->where = e1->where;
2980 res->expr_type = EXPR_OP;
2981 res->value.op.op = op;
2982 res->value.op.op1 = e1;
2983 res->value.op.op2 = e2;
2984 gfc_simplify_expr (res, 0);
2985 return res;
2988 /* Generate the IF statement for a runtime check if we want to do inlining or
2989 not - putting in the code for both branches and putting it into the syntax
2990 tree is the caller's responsibility. For fixed array sizes, this should be
2991 removed by DCE. Only called for rank-two matrices A and B. */
2993 static gfc_code *
2994 inline_limit_check (gfc_expr *a, gfc_expr *b, enum matrix_case m_case)
2996 gfc_expr *inline_limit;
2997 gfc_code *if_1, *if_2, *else_2;
2998 gfc_expr *b2, *a2, *a1, *m1, *m2;
2999 gfc_typespec ts;
3000 gfc_expr *cond;
3002 gcc_assert (m_case == A2B2 || m_case == A2B2T || m_case == A2TB2);
3004 /* Calculation is done in real to avoid integer overflow. */
3006 inline_limit = gfc_get_constant_expr (BT_REAL, gfc_default_real_kind,
3007 &a->where);
3008 mpfr_set_si (inline_limit->value.real, flag_inline_matmul_limit,
3009 GFC_RND_MODE);
3010 mpfr_pow_ui (inline_limit->value.real, inline_limit->value.real, 3,
3011 GFC_RND_MODE);
3013 a1 = get_array_inq_function (GFC_ISYM_SIZE, a, 1);
3014 a2 = get_array_inq_function (GFC_ISYM_SIZE, a, 2);
3015 b2 = get_array_inq_function (GFC_ISYM_SIZE, b, 2);
3017 gfc_clear_ts (&ts);
3018 ts.type = BT_REAL;
3019 ts.kind = gfc_default_real_kind;
3020 gfc_convert_type_warn (a1, &ts, 2, 0);
3021 gfc_convert_type_warn (a2, &ts, 2, 0);
3022 gfc_convert_type_warn (b2, &ts, 2, 0);
3024 m1 = get_operand (INTRINSIC_TIMES, a1, a2);
3025 m2 = get_operand (INTRINSIC_TIMES, m1, b2);
3027 cond = build_logical_expr (INTRINSIC_LE, m2, inline_limit);
3028 gfc_simplify_expr (cond, 0);
3030 else_2 = XCNEW (gfc_code);
3031 else_2->op = EXEC_IF;
3032 else_2->loc = a->where;
3034 if_2 = XCNEW (gfc_code);
3035 if_2->op = EXEC_IF;
3036 if_2->expr1 = cond;
3037 if_2->loc = a->where;
3038 if_2->block = else_2;
3040 if_1 = XCNEW (gfc_code);
3041 if_1->op = EXEC_IF;
3042 if_1->block = if_2;
3043 if_1->loc = a->where;
3045 return if_1;
3049 /* Insert code to issue a runtime error if the expressions are not equal. */
3051 static gfc_code *
3052 runtime_error_ne (gfc_expr *e1, gfc_expr *e2, const char *msg)
3054 gfc_expr *cond;
3055 gfc_code *if_1, *if_2;
3056 gfc_code *c;
3057 gfc_actual_arglist *a1, *a2, *a3;
3059 gcc_assert (e1->where.lb);
3060 /* Build the call to runtime_error. */
3061 c = XCNEW (gfc_code);
3062 c->op = EXEC_CALL;
3063 c->loc = e1->where;
3065 /* Get a null-terminated message string. */
3067 a1 = gfc_get_actual_arglist ();
3068 a1->expr = gfc_get_character_expr (gfc_default_character_kind, &e1->where,
3069 msg, strlen(msg)+1);
3070 c->ext.actual = a1;
3072 /* Pass the value of the first expression. */
3073 a2 = gfc_get_actual_arglist ();
3074 a2->expr = gfc_copy_expr (e1);
3075 a1->next = a2;
3077 /* Pass the value of the second expression. */
3078 a3 = gfc_get_actual_arglist ();
3079 a3->expr = gfc_copy_expr (e2);
3080 a2->next = a3;
3082 gfc_check_fe_runtime_error (c->ext.actual);
3083 gfc_resolve_fe_runtime_error (c);
3085 if_2 = XCNEW (gfc_code);
3086 if_2->op = EXEC_IF;
3087 if_2->loc = e1->where;
3088 if_2->next = c;
3090 if_1 = XCNEW (gfc_code);
3091 if_1->op = EXEC_IF;
3092 if_1->block = if_2;
3093 if_1->loc = e1->where;
3095 cond = build_logical_expr (INTRINSIC_NE, e1, e2);
3096 gfc_simplify_expr (cond, 0);
3097 if_2->expr1 = cond;
3099 return if_1;
3102 /* Handle matrix reallocation. Caller is responsible to insert into
3103 the code tree.
3105 For the two-dimensional case, build
3107 if (allocated(c)) then
3108 if (size(c,1) /= size(a,1) .or. size(c,2) /= size(b,2)) then
3109 deallocate(c)
3110 allocate (c(size(a,1), size(b,2)))
3111 end if
3112 else
3113 allocate (c(size(a,1),size(b,2)))
3114 end if
3116 and for the other cases correspondingly.
3119 static gfc_code *
3120 matmul_lhs_realloc (gfc_expr *c, gfc_expr *a, gfc_expr *b,
3121 enum matrix_case m_case)
3124 gfc_expr *allocated, *alloc_expr;
3125 gfc_code *if_alloc_1, *if_alloc_2, *if_size_1, *if_size_2;
3126 gfc_code *else_alloc;
3127 gfc_code *deallocate, *allocate1, *allocate_else;
3128 gfc_array_ref *ar;
3129 gfc_expr *cond, *ne1, *ne2;
3131 if (warn_realloc_lhs)
3132 gfc_warning (OPT_Wrealloc_lhs,
3133 "Code for reallocating the allocatable array at %L will "
3134 "be added", &c->where);
3136 alloc_expr = gfc_copy_expr (c);
3138 ar = gfc_find_array_ref (alloc_expr);
3139 gcc_assert (ar && ar->type == AR_FULL);
3141 /* c comes in as a full ref. Change it into a copy and make it into an
3142 element ref so it has the right form for for ALLOCATE. In the same
3143 switch statement, also generate the size comparison for the secod IF
3144 statement. */
3146 ar->type = AR_ELEMENT;
3148 switch (m_case)
3150 case A2B2:
3151 ar->start[0] = get_array_inq_function (GFC_ISYM_SIZE, a, 1);
3152 ar->start[1] = get_array_inq_function (GFC_ISYM_SIZE, b, 2);
3153 ne1 = build_logical_expr (INTRINSIC_NE,
3154 get_array_inq_function (GFC_ISYM_SIZE, c, 1),
3155 get_array_inq_function (GFC_ISYM_SIZE, a, 1));
3156 ne2 = build_logical_expr (INTRINSIC_NE,
3157 get_array_inq_function (GFC_ISYM_SIZE, c, 2),
3158 get_array_inq_function (GFC_ISYM_SIZE, b, 2));
3159 cond = build_logical_expr (INTRINSIC_OR, ne1, ne2);
3160 break;
3162 case A2B2T:
3163 ar->start[0] = get_array_inq_function (GFC_ISYM_SIZE, a, 1);
3164 ar->start[1] = get_array_inq_function (GFC_ISYM_SIZE, b, 1);
3166 ne1 = build_logical_expr (INTRINSIC_NE,
3167 get_array_inq_function (GFC_ISYM_SIZE, c, 1),
3168 get_array_inq_function (GFC_ISYM_SIZE, a, 1));
3169 ne2 = build_logical_expr (INTRINSIC_NE,
3170 get_array_inq_function (GFC_ISYM_SIZE, c, 2),
3171 get_array_inq_function (GFC_ISYM_SIZE, b, 1));
3172 cond = build_logical_expr (INTRINSIC_OR, ne1, ne2);
3173 break;
3175 case A2TB2:
3177 ar->start[0] = get_array_inq_function (GFC_ISYM_SIZE, a, 2);
3178 ar->start[1] = get_array_inq_function (GFC_ISYM_SIZE, b, 2);
3180 ne1 = build_logical_expr (INTRINSIC_NE,
3181 get_array_inq_function (GFC_ISYM_SIZE, c, 1),
3182 get_array_inq_function (GFC_ISYM_SIZE, a, 2));
3183 ne2 = build_logical_expr (INTRINSIC_NE,
3184 get_array_inq_function (GFC_ISYM_SIZE, c, 2),
3185 get_array_inq_function (GFC_ISYM_SIZE, b, 2));
3186 cond = build_logical_expr (INTRINSIC_OR, ne1, ne2);
3187 break;
3189 case A2B1:
3190 ar->start[0] = get_array_inq_function (GFC_ISYM_SIZE, a, 1);
3191 cond = build_logical_expr (INTRINSIC_NE,
3192 get_array_inq_function (GFC_ISYM_SIZE, c, 1),
3193 get_array_inq_function (GFC_ISYM_SIZE, a, 2));
3194 break;
3196 case A1B2:
3197 ar->start[0] = get_array_inq_function (GFC_ISYM_SIZE, b, 2);
3198 cond = build_logical_expr (INTRINSIC_NE,
3199 get_array_inq_function (GFC_ISYM_SIZE, c, 1),
3200 get_array_inq_function (GFC_ISYM_SIZE, b, 2));
3201 break;
3203 default:
3204 gcc_unreachable();
3208 gfc_simplify_expr (cond, 0);
3210 /* We need two identical allocate statements in two
3211 branches of the IF statement. */
3213 allocate1 = XCNEW (gfc_code);
3214 allocate1->op = EXEC_ALLOCATE;
3215 allocate1->ext.alloc.list = gfc_get_alloc ();
3216 allocate1->loc = c->where;
3217 allocate1->ext.alloc.list->expr = gfc_copy_expr (alloc_expr);
3219 allocate_else = XCNEW (gfc_code);
3220 allocate_else->op = EXEC_ALLOCATE;
3221 allocate_else->ext.alloc.list = gfc_get_alloc ();
3222 allocate_else->loc = c->where;
3223 allocate_else->ext.alloc.list->expr = alloc_expr;
3225 allocated = gfc_build_intrinsic_call (current_ns, GFC_ISYM_ALLOCATED,
3226 "_gfortran_allocated", c->where,
3227 1, gfc_copy_expr (c));
3229 deallocate = XCNEW (gfc_code);
3230 deallocate->op = EXEC_DEALLOCATE;
3231 deallocate->ext.alloc.list = gfc_get_alloc ();
3232 deallocate->ext.alloc.list->expr = gfc_copy_expr (c);
3233 deallocate->next = allocate1;
3234 deallocate->loc = c->where;
3236 if_size_2 = XCNEW (gfc_code);
3237 if_size_2->op = EXEC_IF;
3238 if_size_2->expr1 = cond;
3239 if_size_2->loc = c->where;
3240 if_size_2->next = deallocate;
3242 if_size_1 = XCNEW (gfc_code);
3243 if_size_1->op = EXEC_IF;
3244 if_size_1->block = if_size_2;
3245 if_size_1->loc = c->where;
3247 else_alloc = XCNEW (gfc_code);
3248 else_alloc->op = EXEC_IF;
3249 else_alloc->loc = c->where;
3250 else_alloc->next = allocate_else;
3252 if_alloc_2 = XCNEW (gfc_code);
3253 if_alloc_2->op = EXEC_IF;
3254 if_alloc_2->expr1 = allocated;
3255 if_alloc_2->loc = c->where;
3256 if_alloc_2->next = if_size_1;
3257 if_alloc_2->block = else_alloc;
3259 if_alloc_1 = XCNEW (gfc_code);
3260 if_alloc_1->op = EXEC_IF;
3261 if_alloc_1->block = if_alloc_2;
3262 if_alloc_1->loc = c->where;
3264 return if_alloc_1;
3267 /* Callback function for has_function_or_op. */
3269 static int
3270 is_function_or_op (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
3271 void *data ATTRIBUTE_UNUSED)
3273 if ((*e) == 0)
3274 return 0;
3275 else
3276 return (*e)->expr_type == EXPR_FUNCTION
3277 || (*e)->expr_type == EXPR_OP;
3280 /* Returns true if the expression contains a function. */
3282 static bool
3283 has_function_or_op (gfc_expr **e)
3285 if (e == NULL)
3286 return false;
3287 else
3288 return gfc_expr_walker (e, is_function_or_op, NULL);
3291 /* Freeze (assign to a temporary variable) a single expression. */
3293 static void
3294 freeze_expr (gfc_expr **ep)
3296 gfc_expr *ne;
3297 if (has_function_or_op (ep))
3299 ne = create_var (*ep, "freeze");
3300 *ep = ne;
3304 /* Go through an expression's references and assign them to temporary
3305 variables if they contain functions. This is usually done prior to
3306 front-end scalarization to avoid multiple invocations of functions. */
3308 static void
3309 freeze_references (gfc_expr *e)
3311 gfc_ref *r;
3312 gfc_array_ref *ar;
3313 int i;
3315 for (r=e->ref; r; r=r->next)
3317 if (r->type == REF_SUBSTRING)
3319 if (r->u.ss.start != NULL)
3320 freeze_expr (&r->u.ss.start);
3322 if (r->u.ss.end != NULL)
3323 freeze_expr (&r->u.ss.end);
3325 else if (r->type == REF_ARRAY)
3327 ar = &r->u.ar;
3328 switch (ar->type)
3330 case AR_FULL:
3331 break;
3333 case AR_SECTION:
3334 for (i=0; i<ar->dimen; i++)
3336 if (ar->dimen_type[i] == DIMEN_RANGE)
3338 freeze_expr (&ar->start[i]);
3339 freeze_expr (&ar->end[i]);
3340 freeze_expr (&ar->stride[i]);
3342 else if (ar->dimen_type[i] == DIMEN_ELEMENT)
3344 freeze_expr (&ar->start[i]);
3347 break;
3349 case AR_ELEMENT:
3350 for (i=0; i<ar->dimen; i++)
3351 freeze_expr (&ar->start[i]);
3352 break;
3354 default:
3355 break;
3361 /* Convert to gfc_index_integer_kind if needed, just do a copy otherwise. */
3363 static gfc_expr *
3364 convert_to_index_kind (gfc_expr *e)
3366 gfc_expr *res;
3368 gcc_assert (e != NULL);
3370 res = gfc_copy_expr (e);
3372 gcc_assert (e->ts.type == BT_INTEGER);
3374 if (res->ts.kind != gfc_index_integer_kind)
3376 gfc_typespec ts;
3377 gfc_clear_ts (&ts);
3378 ts.type = BT_INTEGER;
3379 ts.kind = gfc_index_integer_kind;
3381 gfc_convert_type_warn (e, &ts, 2, 0);
3384 return res;
3387 /* Function to create a DO loop including creation of the
3388 iteration variable. gfc_expr are copied.*/
3390 static gfc_code *
3391 create_do_loop (gfc_expr *start, gfc_expr *end, gfc_expr *step, locus *where,
3392 gfc_namespace *ns, char *vname)
3395 char name[GFC_MAX_SYMBOL_LEN +1];
3396 gfc_symtree *symtree;
3397 gfc_symbol *symbol;
3398 gfc_expr *i;
3399 gfc_code *n, *n2;
3401 /* Create an expression for the iteration variable. */
3402 if (vname)
3403 sprintf (name, "__var_%d_do_%s", var_num++, vname);
3404 else
3405 sprintf (name, "__var_%d_do", var_num++);
3408 if (gfc_get_sym_tree (name, ns, &symtree, false) != 0)
3409 gcc_unreachable ();
3411 /* Create the loop variable. */
3413 symbol = symtree->n.sym;
3414 symbol->ts.type = BT_INTEGER;
3415 symbol->ts.kind = gfc_index_integer_kind;
3416 symbol->attr.flavor = FL_VARIABLE;
3417 symbol->attr.referenced = 1;
3418 symbol->attr.dimension = 0;
3419 symbol->attr.fe_temp = 1;
3420 gfc_commit_symbol (symbol);
3422 i = gfc_get_expr ();
3423 i->expr_type = EXPR_VARIABLE;
3424 i->ts = symbol->ts;
3425 i->rank = 0;
3426 i->where = *where;
3427 i->symtree = symtree;
3429 /* ... and the nested DO statements. */
3430 n = XCNEW (gfc_code);
3431 n->op = EXEC_DO;
3432 n->loc = *where;
3433 n->ext.iterator = gfc_get_iterator ();
3434 n->ext.iterator->var = i;
3435 n->ext.iterator->start = convert_to_index_kind (start);
3436 n->ext.iterator->end = convert_to_index_kind (end);
3437 if (step)
3438 n->ext.iterator->step = convert_to_index_kind (step);
3439 else
3440 n->ext.iterator->step = gfc_get_int_expr (gfc_index_integer_kind,
3441 where, 1);
3443 n2 = XCNEW (gfc_code);
3444 n2->op = EXEC_DO;
3445 n2->loc = *where;
3446 n2->next = NULL;
3447 n->block = n2;
3448 return n;
3451 /* Get the upper bound of the DO loops for matmul along a dimension. This
3452 is one-based. */
3454 static gfc_expr*
3455 get_size_m1 (gfc_expr *e, int dimen)
3457 mpz_t size;
3458 gfc_expr *res;
3460 if (gfc_array_dimen_size (e, dimen - 1, &size))
3462 res = gfc_get_constant_expr (BT_INTEGER,
3463 gfc_index_integer_kind, &e->where);
3464 mpz_sub_ui (res->value.integer, size, 1);
3465 mpz_clear (size);
3467 else
3469 res = get_operand (INTRINSIC_MINUS,
3470 get_array_inq_function (GFC_ISYM_SIZE, e, dimen),
3471 gfc_get_int_expr (gfc_index_integer_kind,
3472 &e->where, 1));
3473 gfc_simplify_expr (res, 0);
3476 return res;
3479 /* Function to return a scalarized expression. It is assumed that indices are
3480 zero based to make generation of DO loops easier. A zero as index will
3481 access the first element along a dimension. Single element references will
3482 be skipped. A NULL as an expression will be replaced by a full reference.
3483 This assumes that the index loops have gfc_index_integer_kind, and that all
3484 references have been frozen. */
3486 static gfc_expr*
3487 scalarized_expr (gfc_expr *e_in, gfc_expr **index, int count_index)
3489 gfc_array_ref *ar;
3490 int i;
3491 int rank;
3492 gfc_expr *e;
3493 int i_index;
3494 bool was_fullref;
3496 e = gfc_copy_expr(e_in);
3498 rank = e->rank;
3500 ar = gfc_find_array_ref (e);
3502 /* We scalarize count_index variables, reducing the rank by count_index. */
3504 e->rank = rank - count_index;
3506 was_fullref = ar->type == AR_FULL;
3508 if (e->rank == 0)
3509 ar->type = AR_ELEMENT;
3510 else
3511 ar->type = AR_SECTION;
3513 /* Loop over the indices. For each index, create the expression
3514 index * stride + lbound(e, dim). */
3516 i_index = 0;
3517 for (i=0; i < ar->dimen; i++)
3519 if (was_fullref || ar->dimen_type[i] == DIMEN_RANGE)
3521 if (index[i_index] != NULL)
3523 gfc_expr *lbound, *nindex;
3524 gfc_expr *loopvar;
3526 loopvar = gfc_copy_expr (index[i_index]);
3528 if (ar->stride[i])
3530 gfc_expr *tmp;
3532 tmp = gfc_copy_expr(ar->stride[i]);
3533 if (tmp->ts.kind != gfc_index_integer_kind)
3535 gfc_typespec ts;
3536 gfc_clear_ts (&ts);
3537 ts.type = BT_INTEGER;
3538 ts.kind = gfc_index_integer_kind;
3539 gfc_convert_type (tmp, &ts, 2);
3541 nindex = get_operand (INTRINSIC_TIMES, loopvar, tmp);
3543 else
3544 nindex = loopvar;
3546 /* Calculate the lower bound of the expression. */
3547 if (ar->start[i])
3549 lbound = gfc_copy_expr (ar->start[i]);
3550 if (lbound->ts.kind != gfc_index_integer_kind)
3552 gfc_typespec ts;
3553 gfc_clear_ts (&ts);
3554 ts.type = BT_INTEGER;
3555 ts.kind = gfc_index_integer_kind;
3556 gfc_convert_type (lbound, &ts, 2);
3560 else
3562 gfc_expr *lbound_e;
3563 gfc_ref *ref;
3565 lbound_e = gfc_copy_expr (e_in);
3567 for (ref = lbound_e->ref; ref; ref = ref->next)
3568 if (ref->type == REF_ARRAY
3569 && (ref->u.ar.type == AR_FULL
3570 || ref->u.ar.type == AR_SECTION))
3571 break;
3573 if (ref->next)
3575 gfc_free_ref_list (ref->next);
3576 ref->next = NULL;
3579 if (!was_fullref)
3581 /* Look at full individual sections, like a(:). The first index
3582 is the lbound of a full ref. */
3583 int j;
3584 gfc_array_ref *ar;
3585 int to;
3587 ar = &ref->u.ar;
3589 /* For assumed size, we need to keep around the final
3590 reference in order not to get an error on resolution
3591 below, and we cannot use AR_FULL. */
3593 if (ar->as->type == AS_ASSUMED_SIZE)
3595 ar->type = AR_SECTION;
3596 to = ar->dimen - 1;
3598 else
3600 to = ar->dimen;
3601 ar->type = AR_FULL;
3604 for (j = 0; j < to; j++)
3606 gfc_free_expr (ar->start[j]);
3607 ar->start[j] = NULL;
3608 gfc_free_expr (ar->end[j]);
3609 ar->end[j] = NULL;
3610 gfc_free_expr (ar->stride[j]);
3611 ar->stride[j] = NULL;
3614 /* We have to get rid of the shape, if there is one. Do
3615 so by freeing it and calling gfc_resolve to rebuild
3616 it, if necessary. */
3618 if (lbound_e->shape)
3619 gfc_free_shape (&(lbound_e->shape), lbound_e->rank);
3621 lbound_e->rank = ar->dimen;
3622 gfc_resolve_expr (lbound_e);
3624 lbound = get_array_inq_function (GFC_ISYM_LBOUND, lbound_e,
3625 i + 1);
3626 gfc_free_expr (lbound_e);
3629 ar->dimen_type[i] = DIMEN_ELEMENT;
3631 gfc_free_expr (ar->start[i]);
3632 ar->start[i] = get_operand (INTRINSIC_PLUS, nindex, lbound);
3634 gfc_free_expr (ar->end[i]);
3635 ar->end[i] = NULL;
3636 gfc_free_expr (ar->stride[i]);
3637 ar->stride[i] = NULL;
3638 gfc_simplify_expr (ar->start[i], 0);
3640 else if (was_fullref)
3642 gfc_internal_error ("Scalarization using DIMEN_RANGE unimplemented");
3644 i_index ++;
3648 return e;
3651 /* Helper function to check for a dimen vector as subscript. */
3653 static bool
3654 has_dimen_vector_ref (gfc_expr *e)
3656 gfc_array_ref *ar;
3657 int i;
3659 ar = gfc_find_array_ref (e);
3660 gcc_assert (ar);
3661 if (ar->type == AR_FULL)
3662 return false;
3664 for (i=0; i<ar->dimen; i++)
3665 if (ar->dimen_type[i] == DIMEN_VECTOR)
3666 return true;
3668 return false;
3671 /* If handed an expression of the form
3673 TRANSPOSE(CONJG(A))
3675 check if A can be handled by matmul and return if there is an uneven number
3676 of CONJG calls. Return a pointer to the array when everything is OK, NULL
3677 otherwise. The caller has to check for the correct rank. */
3679 static gfc_expr*
3680 check_conjg_transpose_variable (gfc_expr *e, bool *conjg, bool *transpose)
3682 *conjg = false;
3683 *transpose = false;
3687 if (e->expr_type == EXPR_VARIABLE)
3689 gcc_assert (e->rank == 1 || e->rank == 2);
3690 return e;
3692 else if (e->expr_type == EXPR_FUNCTION)
3694 if (e->value.function.isym == NULL)
3695 return NULL;
3697 if (e->value.function.isym->id == GFC_ISYM_CONJG)
3698 *conjg = !*conjg;
3699 else if (e->value.function.isym->id == GFC_ISYM_TRANSPOSE)
3700 *transpose = !*transpose;
3701 else return NULL;
3703 else
3704 return NULL;
3706 e = e->value.function.actual->expr;
3708 while(1);
3710 return NULL;
3713 /* Inline assignments of the form c = matmul(a,b).
3714 Handle only the cases currently where b and c are rank-two arrays.
3716 This basically translates the code to
3718 BLOCK
3719 integer i,j,k
3720 c = 0
3721 do j=0, size(b,2)-1
3722 do k=0, size(a, 2)-1
3723 do i=0, size(a, 1)-1
3724 c(i * stride(c,1) + lbound(c,1), j * stride(c,2) + lbound(c,2)) =
3725 c(i * stride(c,1) + lbound(c,1), j * stride(c,2) + lbound(c,2)) +
3726 a(i * stride(a,1) + lbound(a,1), k * stride(a,2) + lbound(a,2)) *
3727 b(k * stride(b,1) + lbound(b,1), j * stride(b,2) + lbound(b,2))
3728 end do
3729 end do
3730 end do
3731 END BLOCK
3735 static int
3736 inline_matmul_assign (gfc_code **c, int *walk_subtrees,
3737 void *data ATTRIBUTE_UNUSED)
3739 gfc_code *co = *c;
3740 gfc_expr *expr1, *expr2;
3741 gfc_expr *matrix_a, *matrix_b;
3742 gfc_actual_arglist *a, *b;
3743 gfc_code *do_1, *do_2, *do_3, *assign_zero, *assign_matmul;
3744 gfc_expr *zero_e;
3745 gfc_expr *u1, *u2, *u3;
3746 gfc_expr *list[2];
3747 gfc_expr *ascalar, *bscalar, *cscalar;
3748 gfc_expr *mult;
3749 gfc_expr *var_1, *var_2, *var_3;
3750 gfc_expr *zero;
3751 gfc_namespace *ns;
3752 gfc_intrinsic_op op_times, op_plus;
3753 enum matrix_case m_case;
3754 int i;
3755 gfc_code *if_limit = NULL;
3756 gfc_code **next_code_point;
3757 bool conjg_a, conjg_b, transpose_a, transpose_b;
3759 if (co->op != EXEC_ASSIGN)
3760 return 0;
3762 if (in_where || in_assoc_list)
3763 return 0;
3765 /* The BLOCKS generated for the temporary variables and FORALL don't
3766 mix. */
3767 if (forall_level > 0)
3768 return 0;
3770 /* For now don't do anything in OpenMP workshare, it confuses
3771 its translation, which expects only the allowed statements in there.
3772 We should figure out how to parallelize this eventually. */
3773 if (in_omp_workshare)
3774 return 0;
3776 expr1 = co->expr1;
3777 expr2 = co->expr2;
3778 if (expr2->expr_type != EXPR_FUNCTION
3779 || expr2->value.function.isym == NULL
3780 || expr2->value.function.isym->id != GFC_ISYM_MATMUL)
3781 return 0;
3783 current_code = c;
3784 inserted_block = NULL;
3785 changed_statement = NULL;
3787 a = expr2->value.function.actual;
3788 matrix_a = check_conjg_transpose_variable (a->expr, &conjg_a, &transpose_a);
3789 if (matrix_a == NULL)
3790 return 0;
3792 b = a->next;
3793 matrix_b = check_conjg_transpose_variable (b->expr, &conjg_b, &transpose_b);
3794 if (matrix_b == NULL)
3795 return 0;
3797 if (has_dimen_vector_ref (expr1) || has_dimen_vector_ref (matrix_a)
3798 || has_dimen_vector_ref (matrix_b))
3799 return 0;
3801 /* We do not handle data dependencies yet. */
3802 if (gfc_check_dependency (expr1, matrix_a, true)
3803 || gfc_check_dependency (expr1, matrix_b, true))
3804 return 0;
3806 m_case = none;
3807 if (matrix_a->rank == 2)
3809 if (transpose_a)
3811 if (matrix_b->rank == 2 && !transpose_b)
3812 m_case = A2TB2;
3814 else
3816 if (matrix_b->rank == 1)
3817 m_case = A2B1;
3818 else /* matrix_b->rank == 2 */
3820 if (transpose_b)
3821 m_case = A2B2T;
3822 else
3823 m_case = A2B2;
3827 else /* matrix_a->rank == 1 */
3829 if (matrix_b->rank == 2)
3831 if (!transpose_b)
3832 m_case = A1B2;
3836 if (m_case == none)
3837 return 0;
3839 ns = insert_block ();
3841 /* Assign the type of the zero expression for initializing the resulting
3842 array, and the expression (+ and * for real, integer and complex;
3843 .and. and .or for logical. */
3845 switch(expr1->ts.type)
3847 case BT_INTEGER:
3848 zero_e = gfc_get_int_expr (expr1->ts.kind, &expr1->where, 0);
3849 op_times = INTRINSIC_TIMES;
3850 op_plus = INTRINSIC_PLUS;
3851 break;
3853 case BT_LOGICAL:
3854 op_times = INTRINSIC_AND;
3855 op_plus = INTRINSIC_OR;
3856 zero_e = gfc_get_logical_expr (expr1->ts.kind, &expr1->where,
3858 break;
3859 case BT_REAL:
3860 zero_e = gfc_get_constant_expr (BT_REAL, expr1->ts.kind,
3861 &expr1->where);
3862 mpfr_set_si (zero_e->value.real, 0, GFC_RND_MODE);
3863 op_times = INTRINSIC_TIMES;
3864 op_plus = INTRINSIC_PLUS;
3865 break;
3867 case BT_COMPLEX:
3868 zero_e = gfc_get_constant_expr (BT_COMPLEX, expr1->ts.kind,
3869 &expr1->where);
3870 mpc_set_si_si (zero_e->value.complex, 0, 0, GFC_RND_MODE);
3871 op_times = INTRINSIC_TIMES;
3872 op_plus = INTRINSIC_PLUS;
3874 break;
3876 default:
3877 gcc_unreachable();
3880 current_code = &ns->code;
3882 /* Freeze the references, keeping track of how many temporary variables were
3883 created. */
3884 n_vars = 0;
3885 freeze_references (matrix_a);
3886 freeze_references (matrix_b);
3887 freeze_references (expr1);
3889 if (n_vars == 0)
3890 next_code_point = current_code;
3891 else
3893 next_code_point = &ns->code;
3894 for (i=0; i<n_vars; i++)
3895 next_code_point = &(*next_code_point)->next;
3898 /* Take care of the inline flag. If the limit check evaluates to a
3899 constant, dead code elimination will eliminate the unneeded branch. */
3901 if (m_case == A2B2 && flag_inline_matmul_limit > 0)
3903 if_limit = inline_limit_check (matrix_a, matrix_b, m_case);
3905 /* Insert the original statement into the else branch. */
3906 if_limit->block->block->next = co;
3907 co->next = NULL;
3909 /* ... and the new ones go into the original one. */
3910 *next_code_point = if_limit;
3911 next_code_point = &if_limit->block->next;
3914 assign_zero = XCNEW (gfc_code);
3915 assign_zero->op = EXEC_ASSIGN;
3916 assign_zero->loc = co->loc;
3917 assign_zero->expr1 = gfc_copy_expr (expr1);
3918 assign_zero->expr2 = zero_e;
3920 /* Handle the reallocation, if needed. */
3921 if (flag_realloc_lhs && gfc_is_reallocatable_lhs (expr1))
3923 gfc_code *lhs_alloc;
3925 /* Only need to check a single dimension for the A2B2 case for
3926 bounds checking, the rest will be allocated. Also check this
3927 for A2B1. */
3929 if ((gfc_option.rtcheck & GFC_RTCHECK_BOUNDS) && (m_case == A2B2 || m_case == A2B1))
3931 gfc_code *test;
3932 gfc_expr *a2, *b1;
3934 a2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 2);
3935 b1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 1);
3936 test = runtime_error_ne (b1, a2, "Dimension of array B incorrect "
3937 "in MATMUL intrinsic: Is %ld, should be %ld");
3938 *next_code_point = test;
3939 next_code_point = &test->next;
3943 lhs_alloc = matmul_lhs_realloc (expr1, matrix_a, matrix_b, m_case);
3945 *next_code_point = lhs_alloc;
3946 next_code_point = &lhs_alloc->next;
3949 else if (gfc_option.rtcheck & GFC_RTCHECK_BOUNDS)
3951 gfc_code *test;
3952 gfc_expr *a2, *b1, *c1, *c2, *a1, *b2;
3954 if (m_case == A2B2 || m_case == A2B1)
3956 a2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 2);
3957 b1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 1);
3958 test = runtime_error_ne (b1, a2, "Dimension of array B incorrect "
3959 "in MATMUL intrinsic: Is %ld, should be %ld");
3960 *next_code_point = test;
3961 next_code_point = &test->next;
3963 c1 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 1);
3964 a1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 1);
3966 if (m_case == A2B2)
3967 test = runtime_error_ne (c1, a1, "Incorrect extent in return array in "
3968 "MATMUL intrinsic for dimension 1: "
3969 "is %ld, should be %ld");
3970 else if (m_case == A2B1)
3971 test = runtime_error_ne (c1, a1, "Incorrect extent in return array in "
3972 "MATMUL intrinsic: "
3973 "is %ld, should be %ld");
3976 *next_code_point = test;
3977 next_code_point = &test->next;
3979 else if (m_case == A1B2)
3981 a1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 1);
3982 b1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 1);
3983 test = runtime_error_ne (b1, a1, "Dimension of array B incorrect "
3984 "in MATMUL intrinsic: Is %ld, should be %ld");
3985 *next_code_point = test;
3986 next_code_point = &test->next;
3988 c1 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 1);
3989 b2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 2);
3991 test = runtime_error_ne (c1, b2, "Incorrect extent in return array in "
3992 "MATMUL intrinsic: "
3993 "is %ld, should be %ld");
3995 *next_code_point = test;
3996 next_code_point = &test->next;
3999 if (m_case == A2B2)
4001 c2 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 2);
4002 b2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 2);
4003 test = runtime_error_ne (c2, b2, "Incorrect extent in return array in "
4004 "MATMUL intrinsic for dimension 2: is %ld, should be %ld");
4006 *next_code_point = test;
4007 next_code_point = &test->next;
4010 if (m_case == A2B2T)
4012 c1 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 1);
4013 a1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 1);
4014 test = runtime_error_ne (c1, a1, "Incorrect extent in return array in "
4015 "MATMUL intrinsic for dimension 1: "
4016 "is %ld, should be %ld");
4018 *next_code_point = test;
4019 next_code_point = &test->next;
4021 c2 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 2);
4022 b1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 1);
4023 test = runtime_error_ne (c2, b1, "Incorrect extent in return array in "
4024 "MATMUL intrinsic for dimension 2: "
4025 "is %ld, should be %ld");
4026 *next_code_point = test;
4027 next_code_point = &test->next;
4029 a2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 2);
4030 b2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 2);
4032 test = runtime_error_ne (b2, a2, "Incorrect extent in argument B in "
4033 "MATMUL intrnisic for dimension 2: "
4034 "is %ld, should be %ld");
4035 *next_code_point = test;
4036 next_code_point = &test->next;
4040 if (m_case == A2TB2)
4042 c1 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 1);
4043 a2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 2);
4045 test = runtime_error_ne (c1, a2, "Incorrect extent in return array in "
4046 "MATMUL intrinsic for dimension 1: "
4047 "is %ld, should be %ld");
4049 *next_code_point = test;
4050 next_code_point = &test->next;
4052 c2 = get_array_inq_function (GFC_ISYM_SIZE, expr1, 2);
4053 b2 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 2);
4054 test = runtime_error_ne (c2, b2, "Incorrect extent in return array in "
4055 "MATMUL intrinsic for dimension 2: "
4056 "is %ld, should be %ld");
4057 *next_code_point = test;
4058 next_code_point = &test->next;
4060 a1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_a, 1);
4061 b1 = get_array_inq_function (GFC_ISYM_SIZE, matrix_b, 1);
4063 test = runtime_error_ne (b1, a1, "Incorrect extent in argument B in "
4064 "MATMUL intrnisic for dimension 2: "
4065 "is %ld, should be %ld");
4066 *next_code_point = test;
4067 next_code_point = &test->next;
4072 *next_code_point = assign_zero;
4074 zero = gfc_get_int_expr (gfc_index_integer_kind, &co->loc, 0);
4076 assign_matmul = XCNEW (gfc_code);
4077 assign_matmul->op = EXEC_ASSIGN;
4078 assign_matmul->loc = co->loc;
4080 /* Get the bounds for the loops, create them and create the scalarized
4081 expressions. */
4083 switch (m_case)
4085 case A2B2:
4086 inline_limit_check (matrix_a, matrix_b, m_case);
4088 u1 = get_size_m1 (matrix_b, 2);
4089 u2 = get_size_m1 (matrix_a, 2);
4090 u3 = get_size_m1 (matrix_a, 1);
4092 do_1 = create_do_loop (gfc_copy_expr (zero), u1, NULL, &co->loc, ns);
4093 do_2 = create_do_loop (gfc_copy_expr (zero), u2, NULL, &co->loc, ns);
4094 do_3 = create_do_loop (gfc_copy_expr (zero), u3, NULL, &co->loc, ns);
4096 do_1->block->next = do_2;
4097 do_2->block->next = do_3;
4098 do_3->block->next = assign_matmul;
4100 var_1 = do_1->ext.iterator->var;
4101 var_2 = do_2->ext.iterator->var;
4102 var_3 = do_3->ext.iterator->var;
4104 list[0] = var_3;
4105 list[1] = var_1;
4106 cscalar = scalarized_expr (co->expr1, list, 2);
4108 list[0] = var_3;
4109 list[1] = var_2;
4110 ascalar = scalarized_expr (matrix_a, list, 2);
4112 list[0] = var_2;
4113 list[1] = var_1;
4114 bscalar = scalarized_expr (matrix_b, list, 2);
4116 break;
4118 case A2B2T:
4119 inline_limit_check (matrix_a, matrix_b, m_case);
4121 u1 = get_size_m1 (matrix_b, 1);
4122 u2 = get_size_m1 (matrix_a, 2);
4123 u3 = get_size_m1 (matrix_a, 1);
4125 do_1 = create_do_loop (gfc_copy_expr (zero), u1, NULL, &co->loc, ns);
4126 do_2 = create_do_loop (gfc_copy_expr (zero), u2, NULL, &co->loc, ns);
4127 do_3 = create_do_loop (gfc_copy_expr (zero), u3, NULL, &co->loc, ns);
4129 do_1->block->next = do_2;
4130 do_2->block->next = do_3;
4131 do_3->block->next = assign_matmul;
4133 var_1 = do_1->ext.iterator->var;
4134 var_2 = do_2->ext.iterator->var;
4135 var_3 = do_3->ext.iterator->var;
4137 list[0] = var_3;
4138 list[1] = var_1;
4139 cscalar = scalarized_expr (co->expr1, list, 2);
4141 list[0] = var_3;
4142 list[1] = var_2;
4143 ascalar = scalarized_expr (matrix_a, list, 2);
4145 list[0] = var_1;
4146 list[1] = var_2;
4147 bscalar = scalarized_expr (matrix_b, list, 2);
4149 break;
4151 case A2TB2:
4152 inline_limit_check (matrix_a, matrix_b, m_case);
4154 u1 = get_size_m1 (matrix_a, 2);
4155 u2 = get_size_m1 (matrix_b, 2);
4156 u3 = get_size_m1 (matrix_a, 1);
4158 do_1 = create_do_loop (gfc_copy_expr (zero), u1, NULL, &co->loc, ns);
4159 do_2 = create_do_loop (gfc_copy_expr (zero), u2, NULL, &co->loc, ns);
4160 do_3 = create_do_loop (gfc_copy_expr (zero), u3, NULL, &co->loc, ns);
4162 do_1->block->next = do_2;
4163 do_2->block->next = do_3;
4164 do_3->block->next = assign_matmul;
4166 var_1 = do_1->ext.iterator->var;
4167 var_2 = do_2->ext.iterator->var;
4168 var_3 = do_3->ext.iterator->var;
4170 list[0] = var_1;
4171 list[1] = var_2;
4172 cscalar = scalarized_expr (co->expr1, list, 2);
4174 list[0] = var_3;
4175 list[1] = var_1;
4176 ascalar = scalarized_expr (matrix_a, list, 2);
4178 list[0] = var_3;
4179 list[1] = var_2;
4180 bscalar = scalarized_expr (matrix_b, list, 2);
4182 break;
4184 case A2B1:
4185 u1 = get_size_m1 (matrix_b, 1);
4186 u2 = get_size_m1 (matrix_a, 1);
4188 do_1 = create_do_loop (gfc_copy_expr (zero), u1, NULL, &co->loc, ns);
4189 do_2 = create_do_loop (gfc_copy_expr (zero), u2, NULL, &co->loc, ns);
4191 do_1->block->next = do_2;
4192 do_2->block->next = assign_matmul;
4194 var_1 = do_1->ext.iterator->var;
4195 var_2 = do_2->ext.iterator->var;
4197 list[0] = var_2;
4198 cscalar = scalarized_expr (co->expr1, list, 1);
4200 list[0] = var_2;
4201 list[1] = var_1;
4202 ascalar = scalarized_expr (matrix_a, list, 2);
4204 list[0] = var_1;
4205 bscalar = scalarized_expr (matrix_b, list, 1);
4207 break;
4209 case A1B2:
4210 u1 = get_size_m1 (matrix_b, 2);
4211 u2 = get_size_m1 (matrix_a, 1);
4213 do_1 = create_do_loop (gfc_copy_expr (zero), u1, NULL, &co->loc, ns);
4214 do_2 = create_do_loop (gfc_copy_expr (zero), u2, NULL, &co->loc, ns);
4216 do_1->block->next = do_2;
4217 do_2->block->next = assign_matmul;
4219 var_1 = do_1->ext.iterator->var;
4220 var_2 = do_2->ext.iterator->var;
4222 list[0] = var_1;
4223 cscalar = scalarized_expr (co->expr1, list, 1);
4225 list[0] = var_2;
4226 ascalar = scalarized_expr (matrix_a, list, 1);
4228 list[0] = var_2;
4229 list[1] = var_1;
4230 bscalar = scalarized_expr (matrix_b, list, 2);
4232 break;
4234 default:
4235 gcc_unreachable();
4238 /* Build the conjg call around the variables. Set the typespec manually
4239 because gfc_build_intrinsic_call sometimes gets this wrong. */
4240 if (conjg_a)
4242 gfc_typespec ts;
4243 ts = matrix_a->ts;
4244 ascalar = gfc_build_intrinsic_call (ns, GFC_ISYM_CONJG, "conjg",
4245 matrix_a->where, 1, ascalar);
4246 ascalar->ts = ts;
4249 if (conjg_b)
4251 gfc_typespec ts;
4252 ts = matrix_b->ts;
4253 bscalar = gfc_build_intrinsic_call (ns, GFC_ISYM_CONJG, "conjg",
4254 matrix_b->where, 1, bscalar);
4255 bscalar->ts = ts;
4257 /* First loop comes after the zero assignment. */
4258 assign_zero->next = do_1;
4260 /* Build the assignment expression in the loop. */
4261 assign_matmul->expr1 = gfc_copy_expr (cscalar);
4263 mult = get_operand (op_times, ascalar, bscalar);
4264 assign_matmul->expr2 = get_operand (op_plus, cscalar, mult);
4266 /* If we don't want to keep the original statement around in
4267 the else branch, we can free it. */
4269 if (if_limit == NULL)
4270 gfc_free_statements(co);
4271 else
4272 co->next = NULL;
4274 gfc_free_expr (zero);
4275 *walk_subtrees = 0;
4276 return 0;
4280 /* Code for index interchange for loops which are grouped together in DO
4281 CONCURRENT or FORALL statements. This is currently only applied if the
4282 iterations are grouped together in a single statement.
4284 For this transformation, it is assumed that memory access in strides is
4285 expensive, and that loops which access later indices (which access memory
4286 in bigger strides) should be moved to the first loops.
4288 For this, a loop over all the statements is executed, counting the times
4289 that the loop iteration values are accessed in each index. The loop
4290 indices are then sorted to minimize access to later indices from inner
4291 loops. */
4293 /* Type for holding index information. */
4295 typedef struct {
4296 gfc_symbol *sym;
4297 gfc_forall_iterator *fa;
4298 int num;
4299 int n[GFC_MAX_DIMENSIONS];
4300 } ind_type;
4302 /* Callback function to determine if an expression is the
4303 corresponding variable. */
4305 static int
4306 has_var (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED, void *data)
4308 gfc_expr *expr = *e;
4309 gfc_symbol *sym;
4311 if (expr->expr_type != EXPR_VARIABLE)
4312 return 0;
4314 sym = (gfc_symbol *) data;
4315 return sym == expr->symtree->n.sym;
4318 /* Callback function to calculate the cost of a certain index. */
4320 static int
4321 index_cost (gfc_expr **e, int *walk_subtrees ATTRIBUTE_UNUSED,
4322 void *data)
4324 ind_type *ind;
4325 gfc_expr *expr;
4326 gfc_array_ref *ar;
4327 gfc_ref *ref;
4328 int i,j;
4330 expr = *e;
4331 if (expr->expr_type != EXPR_VARIABLE)
4332 return 0;
4334 ar = NULL;
4335 for (ref = expr->ref; ref; ref = ref->next)
4337 if (ref->type == REF_ARRAY)
4339 ar = &ref->u.ar;
4340 break;
4343 if (ar == NULL || ar->type != AR_ELEMENT)
4344 return 0;
4346 ind = (ind_type *) data;
4347 for (i = 0; i < ar->dimen; i++)
4349 for (j=0; ind[j].sym != NULL; j++)
4351 if (gfc_expr_walker (&ar->start[i], has_var, (void *) (ind[j].sym)))
4352 ind[j].n[i]++;
4355 return 0;
4358 /* Callback function for qsort, to sort the loop indices. */
4360 static int
4361 loop_comp (const void *e1, const void *e2)
4363 const ind_type *i1 = (const ind_type *) e1;
4364 const ind_type *i2 = (const ind_type *) e2;
4365 int i;
4367 for (i=GFC_MAX_DIMENSIONS-1; i >= 0; i--)
4369 if (i1->n[i] != i2->n[i])
4370 return i1->n[i] - i2->n[i];
4372 /* All other things being equal, let's not change the ordering. */
4373 return i2->num - i1->num;
4376 /* Main function to do the index interchange. */
4378 static int
4379 index_interchange (gfc_code **c, int *walk_subtrees ATTRIBUTE_UNUSED,
4380 void *data ATTRIBUTE_UNUSED)
4382 gfc_code *co;
4383 co = *c;
4384 int n_iter;
4385 gfc_forall_iterator *fa;
4386 ind_type *ind;
4387 int i, j;
4389 if (co->op != EXEC_FORALL && co->op != EXEC_DO_CONCURRENT)
4390 return 0;
4392 n_iter = 0;
4393 for (fa = co->ext.forall_iterator; fa; fa = fa->next)
4394 n_iter ++;
4396 /* Nothing to reorder. */
4397 if (n_iter < 2)
4398 return 0;
4400 ind = XALLOCAVEC (ind_type, n_iter + 1);
4402 i = 0;
4403 for (fa = co->ext.forall_iterator; fa; fa = fa->next)
4405 ind[i].sym = fa->var->symtree->n.sym;
4406 ind[i].fa = fa;
4407 for (j=0; j<GFC_MAX_DIMENSIONS; j++)
4408 ind[i].n[j] = 0;
4409 ind[i].num = i;
4410 i++;
4412 ind[n_iter].sym = NULL;
4413 ind[n_iter].fa = NULL;
4415 gfc_code_walker (c, gfc_dummy_code_callback, index_cost, (void *) ind);
4416 qsort ((void *) ind, n_iter, sizeof (ind_type), loop_comp);
4418 /* Do the actual index interchange. */
4419 co->ext.forall_iterator = fa = ind[0].fa;
4420 for (i=1; i<n_iter; i++)
4422 fa->next = ind[i].fa;
4423 fa = fa->next;
4425 fa->next = NULL;
4427 if (flag_warn_frontend_loop_interchange)
4429 for (i=1; i<n_iter; i++)
4431 if (ind[i-1].num > ind[i].num)
4433 gfc_warning (OPT_Wfrontend_loop_interchange,
4434 "Interchanging loops at %L", &co->loc);
4435 break;
4440 return 0;
4443 #define WALK_SUBEXPR(NODE) \
4444 do \
4446 result = gfc_expr_walker (&(NODE), exprfn, data); \
4447 if (result) \
4448 return result; \
4450 while (0)
4451 #define WALK_SUBEXPR_TAIL(NODE) e = &(NODE); continue
4453 /* Walk expression *E, calling EXPRFN on each expression in it. */
4456 gfc_expr_walker (gfc_expr **e, walk_expr_fn_t exprfn, void *data)
4458 while (*e)
4460 int walk_subtrees = 1;
4461 gfc_actual_arglist *a;
4462 gfc_ref *r;
4463 gfc_constructor *c;
4465 int result = exprfn (e, &walk_subtrees, data);
4466 if (result)
4467 return result;
4468 if (walk_subtrees)
4469 switch ((*e)->expr_type)
4471 case EXPR_OP:
4472 WALK_SUBEXPR ((*e)->value.op.op1);
4473 WALK_SUBEXPR_TAIL ((*e)->value.op.op2);
4474 break;
4475 case EXPR_FUNCTION:
4476 for (a = (*e)->value.function.actual; a; a = a->next)
4477 WALK_SUBEXPR (a->expr);
4478 break;
4479 case EXPR_COMPCALL:
4480 case EXPR_PPC:
4481 WALK_SUBEXPR ((*e)->value.compcall.base_object);
4482 for (a = (*e)->value.compcall.actual; a; a = a->next)
4483 WALK_SUBEXPR (a->expr);
4484 break;
4486 case EXPR_STRUCTURE:
4487 case EXPR_ARRAY:
4488 for (c = gfc_constructor_first ((*e)->value.constructor); c;
4489 c = gfc_constructor_next (c))
4491 if (c->iterator == NULL)
4492 WALK_SUBEXPR (c->expr);
4493 else
4495 iterator_level ++;
4496 WALK_SUBEXPR (c->expr);
4497 iterator_level --;
4498 WALK_SUBEXPR (c->iterator->var);
4499 WALK_SUBEXPR (c->iterator->start);
4500 WALK_SUBEXPR (c->iterator->end);
4501 WALK_SUBEXPR (c->iterator->step);
4505 if ((*e)->expr_type != EXPR_ARRAY)
4506 break;
4508 /* Fall through to the variable case in order to walk the
4509 reference. */
4510 gcc_fallthrough ();
4512 case EXPR_SUBSTRING:
4513 case EXPR_VARIABLE:
4514 for (r = (*e)->ref; r; r = r->next)
4516 gfc_array_ref *ar;
4517 int i;
4519 switch (r->type)
4521 case REF_ARRAY:
4522 ar = &r->u.ar;
4523 if (ar->type == AR_SECTION || ar->type == AR_ELEMENT)
4525 for (i=0; i< ar->dimen; i++)
4527 WALK_SUBEXPR (ar->start[i]);
4528 WALK_SUBEXPR (ar->end[i]);
4529 WALK_SUBEXPR (ar->stride[i]);
4533 break;
4535 case REF_SUBSTRING:
4536 WALK_SUBEXPR (r->u.ss.start);
4537 WALK_SUBEXPR (r->u.ss.end);
4538 break;
4540 case REF_COMPONENT:
4541 break;
4545 default:
4546 break;
4548 return 0;
4550 return 0;
4553 #define WALK_SUBCODE(NODE) \
4554 do \
4556 result = gfc_code_walker (&(NODE), codefn, exprfn, data); \
4557 if (result) \
4558 return result; \
4560 while (0)
4562 /* Walk code *C, calling CODEFN on each gfc_code node in it and calling EXPRFN
4563 on each expression in it. If any of the hooks returns non-zero, that
4564 value is immediately returned. If the hook sets *WALK_SUBTREES to 0,
4565 no subcodes or subexpressions are traversed. */
4568 gfc_code_walker (gfc_code **c, walk_code_fn_t codefn, walk_expr_fn_t exprfn,
4569 void *data)
4571 for (; *c; c = &(*c)->next)
4573 int walk_subtrees = 1;
4574 int result = codefn (c, &walk_subtrees, data);
4575 if (result)
4576 return result;
4578 if (walk_subtrees)
4580 gfc_code *b;
4581 gfc_actual_arglist *a;
4582 gfc_code *co;
4583 gfc_association_list *alist;
4584 bool saved_in_omp_workshare;
4585 bool saved_in_where;
4587 /* There might be statement insertions before the current code,
4588 which must not affect the expression walker. */
4590 co = *c;
4591 saved_in_omp_workshare = in_omp_workshare;
4592 saved_in_where = in_where;
4594 switch (co->op)
4597 case EXEC_BLOCK:
4598 WALK_SUBCODE (co->ext.block.ns->code);
4599 if (co->ext.block.assoc)
4601 bool saved_in_assoc_list = in_assoc_list;
4603 in_assoc_list = true;
4604 for (alist = co->ext.block.assoc; alist; alist = alist->next)
4605 WALK_SUBEXPR (alist->target);
4607 in_assoc_list = saved_in_assoc_list;
4610 break;
4612 case EXEC_DO:
4613 doloop_level ++;
4614 WALK_SUBEXPR (co->ext.iterator->var);
4615 WALK_SUBEXPR (co->ext.iterator->start);
4616 WALK_SUBEXPR (co->ext.iterator->end);
4617 WALK_SUBEXPR (co->ext.iterator->step);
4618 break;
4620 case EXEC_IF:
4621 if_level ++;
4622 break;
4624 case EXEC_WHERE:
4625 in_where = true;
4626 break;
4628 case EXEC_CALL:
4629 case EXEC_ASSIGN_CALL:
4630 for (a = co->ext.actual; a; a = a->next)
4631 WALK_SUBEXPR (a->expr);
4632 break;
4634 case EXEC_CALL_PPC:
4635 WALK_SUBEXPR (co->expr1);
4636 for (a = co->ext.actual; a; a = a->next)
4637 WALK_SUBEXPR (a->expr);
4638 break;
4640 case EXEC_SELECT:
4641 WALK_SUBEXPR (co->expr1);
4642 select_level ++;
4643 for (b = co->block; b; b = b->block)
4645 gfc_case *cp;
4646 for (cp = b->ext.block.case_list; cp; cp = cp->next)
4648 WALK_SUBEXPR (cp->low);
4649 WALK_SUBEXPR (cp->high);
4651 WALK_SUBCODE (b->next);
4653 continue;
4655 case EXEC_ALLOCATE:
4656 case EXEC_DEALLOCATE:
4658 gfc_alloc *a;
4659 for (a = co->ext.alloc.list; a; a = a->next)
4660 WALK_SUBEXPR (a->expr);
4661 break;
4664 case EXEC_FORALL:
4665 case EXEC_DO_CONCURRENT:
4667 gfc_forall_iterator *fa;
4668 for (fa = co->ext.forall_iterator; fa; fa = fa->next)
4670 WALK_SUBEXPR (fa->var);
4671 WALK_SUBEXPR (fa->start);
4672 WALK_SUBEXPR (fa->end);
4673 WALK_SUBEXPR (fa->stride);
4675 if (co->op == EXEC_FORALL)
4676 forall_level ++;
4677 break;
4680 case EXEC_OPEN:
4681 WALK_SUBEXPR (co->ext.open->unit);
4682 WALK_SUBEXPR (co->ext.open->file);
4683 WALK_SUBEXPR (co->ext.open->status);
4684 WALK_SUBEXPR (co->ext.open->access);
4685 WALK_SUBEXPR (co->ext.open->form);
4686 WALK_SUBEXPR (co->ext.open->recl);
4687 WALK_SUBEXPR (co->ext.open->blank);
4688 WALK_SUBEXPR (co->ext.open->position);
4689 WALK_SUBEXPR (co->ext.open->action);
4690 WALK_SUBEXPR (co->ext.open->delim);
4691 WALK_SUBEXPR (co->ext.open->pad);
4692 WALK_SUBEXPR (co->ext.open->iostat);
4693 WALK_SUBEXPR (co->ext.open->iomsg);
4694 WALK_SUBEXPR (co->ext.open->convert);
4695 WALK_SUBEXPR (co->ext.open->decimal);
4696 WALK_SUBEXPR (co->ext.open->encoding);
4697 WALK_SUBEXPR (co->ext.open->round);
4698 WALK_SUBEXPR (co->ext.open->sign);
4699 WALK_SUBEXPR (co->ext.open->asynchronous);
4700 WALK_SUBEXPR (co->ext.open->id);
4701 WALK_SUBEXPR (co->ext.open->newunit);
4702 WALK_SUBEXPR (co->ext.open->share);
4703 WALK_SUBEXPR (co->ext.open->cc);
4704 break;
4706 case EXEC_CLOSE:
4707 WALK_SUBEXPR (co->ext.close->unit);
4708 WALK_SUBEXPR (co->ext.close->status);
4709 WALK_SUBEXPR (co->ext.close->iostat);
4710 WALK_SUBEXPR (co->ext.close->iomsg);
4711 break;
4713 case EXEC_BACKSPACE:
4714 case EXEC_ENDFILE:
4715 case EXEC_REWIND:
4716 case EXEC_FLUSH:
4717 WALK_SUBEXPR (co->ext.filepos->unit);
4718 WALK_SUBEXPR (co->ext.filepos->iostat);
4719 WALK_SUBEXPR (co->ext.filepos->iomsg);
4720 break;
4722 case EXEC_INQUIRE:
4723 WALK_SUBEXPR (co->ext.inquire->unit);
4724 WALK_SUBEXPR (co->ext.inquire->file);
4725 WALK_SUBEXPR (co->ext.inquire->iomsg);
4726 WALK_SUBEXPR (co->ext.inquire->iostat);
4727 WALK_SUBEXPR (co->ext.inquire->exist);
4728 WALK_SUBEXPR (co->ext.inquire->opened);
4729 WALK_SUBEXPR (co->ext.inquire->number);
4730 WALK_SUBEXPR (co->ext.inquire->named);
4731 WALK_SUBEXPR (co->ext.inquire->name);
4732 WALK_SUBEXPR (co->ext.inquire->access);
4733 WALK_SUBEXPR (co->ext.inquire->sequential);
4734 WALK_SUBEXPR (co->ext.inquire->direct);
4735 WALK_SUBEXPR (co->ext.inquire->form);
4736 WALK_SUBEXPR (co->ext.inquire->formatted);
4737 WALK_SUBEXPR (co->ext.inquire->unformatted);
4738 WALK_SUBEXPR (co->ext.inquire->recl);
4739 WALK_SUBEXPR (co->ext.inquire->nextrec);
4740 WALK_SUBEXPR (co->ext.inquire->blank);
4741 WALK_SUBEXPR (co->ext.inquire->position);
4742 WALK_SUBEXPR (co->ext.inquire->action);
4743 WALK_SUBEXPR (co->ext.inquire->read);
4744 WALK_SUBEXPR (co->ext.inquire->write);
4745 WALK_SUBEXPR (co->ext.inquire->readwrite);
4746 WALK_SUBEXPR (co->ext.inquire->delim);
4747 WALK_SUBEXPR (co->ext.inquire->encoding);
4748 WALK_SUBEXPR (co->ext.inquire->pad);
4749 WALK_SUBEXPR (co->ext.inquire->iolength);
4750 WALK_SUBEXPR (co->ext.inquire->convert);
4751 WALK_SUBEXPR (co->ext.inquire->strm_pos);
4752 WALK_SUBEXPR (co->ext.inquire->asynchronous);
4753 WALK_SUBEXPR (co->ext.inquire->decimal);
4754 WALK_SUBEXPR (co->ext.inquire->pending);
4755 WALK_SUBEXPR (co->ext.inquire->id);
4756 WALK_SUBEXPR (co->ext.inquire->sign);
4757 WALK_SUBEXPR (co->ext.inquire->size);
4758 WALK_SUBEXPR (co->ext.inquire->round);
4759 break;
4761 case EXEC_WAIT:
4762 WALK_SUBEXPR (co->ext.wait->unit);
4763 WALK_SUBEXPR (co->ext.wait->iostat);
4764 WALK_SUBEXPR (co->ext.wait->iomsg);
4765 WALK_SUBEXPR (co->ext.wait->id);
4766 break;
4768 case EXEC_READ:
4769 case EXEC_WRITE:
4770 WALK_SUBEXPR (co->ext.dt->io_unit);
4771 WALK_SUBEXPR (co->ext.dt->format_expr);
4772 WALK_SUBEXPR (co->ext.dt->rec);
4773 WALK_SUBEXPR (co->ext.dt->advance);
4774 WALK_SUBEXPR (co->ext.dt->iostat);
4775 WALK_SUBEXPR (co->ext.dt->size);
4776 WALK_SUBEXPR (co->ext.dt->iomsg);
4777 WALK_SUBEXPR (co->ext.dt->id);
4778 WALK_SUBEXPR (co->ext.dt->pos);
4779 WALK_SUBEXPR (co->ext.dt->asynchronous);
4780 WALK_SUBEXPR (co->ext.dt->blank);
4781 WALK_SUBEXPR (co->ext.dt->decimal);
4782 WALK_SUBEXPR (co->ext.dt->delim);
4783 WALK_SUBEXPR (co->ext.dt->pad);
4784 WALK_SUBEXPR (co->ext.dt->round);
4785 WALK_SUBEXPR (co->ext.dt->sign);
4786 WALK_SUBEXPR (co->ext.dt->extra_comma);
4787 break;
4789 case EXEC_OMP_PARALLEL:
4790 case EXEC_OMP_PARALLEL_DO:
4791 case EXEC_OMP_PARALLEL_DO_SIMD:
4792 case EXEC_OMP_PARALLEL_SECTIONS:
4794 in_omp_workshare = false;
4796 /* This goto serves as a shortcut to avoid code
4797 duplication or a larger if or switch statement. */
4798 goto check_omp_clauses;
4800 case EXEC_OMP_WORKSHARE:
4801 case EXEC_OMP_PARALLEL_WORKSHARE:
4803 in_omp_workshare = true;
4805 /* Fall through */
4807 case EXEC_OMP_CRITICAL:
4808 case EXEC_OMP_DISTRIBUTE:
4809 case EXEC_OMP_DISTRIBUTE_PARALLEL_DO:
4810 case EXEC_OMP_DISTRIBUTE_PARALLEL_DO_SIMD:
4811 case EXEC_OMP_DISTRIBUTE_SIMD:
4812 case EXEC_OMP_DO:
4813 case EXEC_OMP_DO_SIMD:
4814 case EXEC_OMP_ORDERED:
4815 case EXEC_OMP_SECTIONS:
4816 case EXEC_OMP_SINGLE:
4817 case EXEC_OMP_END_SINGLE:
4818 case EXEC_OMP_SIMD:
4819 case EXEC_OMP_TASKLOOP:
4820 case EXEC_OMP_TASKLOOP_SIMD:
4821 case EXEC_OMP_TARGET:
4822 case EXEC_OMP_TARGET_DATA:
4823 case EXEC_OMP_TARGET_ENTER_DATA:
4824 case EXEC_OMP_TARGET_EXIT_DATA:
4825 case EXEC_OMP_TARGET_PARALLEL:
4826 case EXEC_OMP_TARGET_PARALLEL_DO:
4827 case EXEC_OMP_TARGET_PARALLEL_DO_SIMD:
4828 case EXEC_OMP_TARGET_SIMD:
4829 case EXEC_OMP_TARGET_TEAMS:
4830 case EXEC_OMP_TARGET_TEAMS_DISTRIBUTE:
4831 case EXEC_OMP_TARGET_TEAMS_DISTRIBUTE_PARALLEL_DO:
4832 case EXEC_OMP_TARGET_TEAMS_DISTRIBUTE_PARALLEL_DO_SIMD:
4833 case EXEC_OMP_TARGET_TEAMS_DISTRIBUTE_SIMD:
4834 case EXEC_OMP_TARGET_UPDATE:
4835 case EXEC_OMP_TASK:
4836 case EXEC_OMP_TEAMS:
4837 case EXEC_OMP_TEAMS_DISTRIBUTE:
4838 case EXEC_OMP_TEAMS_DISTRIBUTE_PARALLEL_DO:
4839 case EXEC_OMP_TEAMS_DISTRIBUTE_PARALLEL_DO_SIMD:
4840 case EXEC_OMP_TEAMS_DISTRIBUTE_SIMD:
4842 /* Come to this label only from the
4843 EXEC_OMP_PARALLEL_* cases above. */
4845 check_omp_clauses:
4847 if (co->ext.omp_clauses)
4849 gfc_omp_namelist *n;
4850 static int list_types[]
4851 = { OMP_LIST_ALIGNED, OMP_LIST_LINEAR, OMP_LIST_DEPEND,
4852 OMP_LIST_MAP, OMP_LIST_TO, OMP_LIST_FROM };
4853 size_t idx;
4854 WALK_SUBEXPR (co->ext.omp_clauses->if_expr);
4855 WALK_SUBEXPR (co->ext.omp_clauses->final_expr);
4856 WALK_SUBEXPR (co->ext.omp_clauses->num_threads);
4857 WALK_SUBEXPR (co->ext.omp_clauses->chunk_size);
4858 WALK_SUBEXPR (co->ext.omp_clauses->safelen_expr);
4859 WALK_SUBEXPR (co->ext.omp_clauses->simdlen_expr);
4860 WALK_SUBEXPR (co->ext.omp_clauses->num_teams);
4861 WALK_SUBEXPR (co->ext.omp_clauses->device);
4862 WALK_SUBEXPR (co->ext.omp_clauses->thread_limit);
4863 WALK_SUBEXPR (co->ext.omp_clauses->dist_chunk_size);
4864 WALK_SUBEXPR (co->ext.omp_clauses->grainsize);
4865 WALK_SUBEXPR (co->ext.omp_clauses->hint);
4866 WALK_SUBEXPR (co->ext.omp_clauses->num_tasks);
4867 WALK_SUBEXPR (co->ext.omp_clauses->priority);
4868 for (idx = 0; idx < OMP_IF_LAST; idx++)
4869 WALK_SUBEXPR (co->ext.omp_clauses->if_exprs[idx]);
4870 for (idx = 0;
4871 idx < sizeof (list_types) / sizeof (list_types[0]);
4872 idx++)
4873 for (n = co->ext.omp_clauses->lists[list_types[idx]];
4874 n; n = n->next)
4875 WALK_SUBEXPR (n->expr);
4877 break;
4878 default:
4879 break;
4882 WALK_SUBEXPR (co->expr1);
4883 WALK_SUBEXPR (co->expr2);
4884 WALK_SUBEXPR (co->expr3);
4885 WALK_SUBEXPR (co->expr4);
4886 for (b = co->block; b; b = b->block)
4888 WALK_SUBEXPR (b->expr1);
4889 WALK_SUBEXPR (b->expr2);
4890 WALK_SUBCODE (b->next);
4893 if (co->op == EXEC_FORALL)
4894 forall_level --;
4896 if (co->op == EXEC_DO)
4897 doloop_level --;
4899 if (co->op == EXEC_IF)
4900 if_level --;
4902 if (co->op == EXEC_SELECT)
4903 select_level --;
4905 in_omp_workshare = saved_in_omp_workshare;
4906 in_where = saved_in_where;
4909 return 0;