gcc/tree-data-ref.c

   1 /* Data references and dependences detectors.
   2    Copyright (C) 2003-2015 Free Software Foundation, Inc.
   3    Contributed by Sebastian Pop <pop@cri.ensmp.fr>
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* This pass walks a given loop structure searching for array
  22    references.  The information about the array accesses is recorded
  23    in DATA_REFERENCE structures.
  24
  25    The basic test for determining the dependences is:
  26    given two access functions chrec1 and chrec2 to a same array, and
  27    x and y two vectors from the iteration domain, the same element of
  28    the array is accessed twice at iterations x and y if and only if:
  29    |             chrec1 (x) == chrec2 (y).
  30
  31    The goals of this analysis are:
  32
  33    - to determine the independence: the relation between two
  34      independent accesses is qualified with the chrec_known (this
  35      information allows a loop parallelization),
  36
  37    - when two data references access the same data, to qualify the
  38      dependence relation with classic dependence representations:
  39
  40        - distance vectors
  41        - direction vectors
  42        - loop carried level dependence
  43        - polyhedron dependence
  44      or with the chains of recurrences based representation,
  45
  46    - to define a knowledge base for storing the data dependence
  47      information,
  48
  49    - to define an interface to access this data.
  50
  51
  52    Definitions:
  53
  54    - subscript: given two array accesses a subscript is the tuple
  55    composed of the access functions for a given dimension.  Example:
  56    Given A[f1][f2][f3] and B[g1][g2][g3], there are three subscripts:
  57    (f1, g1), (f2, g2), (f3, g3).
  58
  59    - Diophantine equation: an equation whose coefficients and
  60    solutions are integer constants, for example the equation
  61    |   3*x + 2*y = 1
  62    has an integer solution x = 1 and y = -1.
  63
  64    References:
  65
  66    - "Advanced Compilation for High Performance Computing" by Randy
  67    Allen and Ken Kennedy.
  68    http://citeseer.ist.psu.edu/goff91practical.html
  69
  70    - "Loop Transformations for Restructuring Compilers - The Foundations"
  71    by Utpal Banerjee.
  72
  73
  74 */
  75
  76 #include "config.h"
  77 #include "system.h"
  78 #include "coretypes.h"
  79 #include "alias.h"
  80 #include "backend.h"
  81 #include "tree.h"
  82 #include "gimple.h"
  83 #include "rtl.h"
  84 #include "options.h"
  85 #include "fold-const.h"
  86 #include "flags.h"
  87 #include "insn-config.h"
  88 #include "expmed.h"
  89 #include "dojump.h"
  90 #include "explow.h"
  91 #include "calls.h"
  92 #include "emit-rtl.h"
  93 #include "varasm.h"
  94 #include "stmt.h"
  95 #include "expr.h"
  96 #include "gimple-pretty-print.h"
  97 #include "internal-fn.h"
  98 #include "gimple-iterator.h"
  99 #include "tree-ssa-loop-niter.h"
 100 #include "tree-ssa-loop.h"
 101 #include "tree-ssa.h"
 102 #include "cfgloop.h"
 103 #include "tree-data-ref.h"
 104 #include "tree-scalar-evolution.h"
 105 #include "dumpfile.h"
 106 #include "langhooks.h"
 107 #include "tree-affine.h"
 108 #include "params.h"
 109
 110 static struct datadep_stats
 111 {
 112   int num_dependence_tests;
 113   int num_dependence_dependent;
 114   int num_dependence_independent;
 115   int num_dependence_undetermined;
 116
 117   int num_subscript_tests;
 118   int num_subscript_undetermined;
 119   int num_same_subscript_function;
 120
 121   int num_ziv;
 122   int num_ziv_independent;
 123   int num_ziv_dependent;
 124   int num_ziv_unimplemented;
 125
 126   int num_siv;
 127   int num_siv_independent;
 128   int num_siv_dependent;
 129   int num_siv_unimplemented;
 130
 131   int num_miv;
 132   int num_miv_independent;
 133   int num_miv_dependent;
 134   int num_miv_unimplemented;
 135 } dependence_stats;
 136
 137 static bool subscript_dependence_tester_1 (struct data_dependence_relation *,
 138                                            struct data_reference *,
 139                                            struct data_reference *,
 140                                            struct loop *);
 141 /* Returns true iff A divides B.  */
 142
 143 static inline bool
 144 tree_fold_divides_p (const_tree a, const_tree b)
 145 {
 146   gcc_assert (TREE_CODE (a) == INTEGER_CST);
 147   gcc_assert (TREE_CODE (b) == INTEGER_CST);
 148   return integer_zerop (int_const_binop (TRUNC_MOD_EXPR, b, a));
 149 }
 150
 151 /* Returns true iff A divides B.  */
 152
 153 static inline bool
 154 int_divides_p (int a, int b)
 155 {
 156   return ((b % a) == 0);
 157 }
 158
 159 \f
 160
 161 /* Dump into FILE all the data references from DATAREFS.  */
 162
 163 static void
 164 dump_data_references (FILE *file, vec<data_reference_p> datarefs)
 165 {
 166   unsigned int i;
 167   struct data_reference *dr;
 168
 169   FOR_EACH_VEC_ELT (datarefs, i, dr)
 170     dump_data_reference (file, dr);
 171 }
 172
 173 /* Unified dump into FILE all the data references from DATAREFS.  */
 174
 175 DEBUG_FUNCTION void
 176 debug (vec<data_reference_p> &ref)
 177 {
 178   dump_data_references (stderr, ref);
 179 }
 180
 181 DEBUG_FUNCTION void
 182 debug (vec<data_reference_p> *ptr)
 183 {
 184   if (ptr)
 185     debug (*ptr);
 186   else
 187     fprintf (stderr, "<nil>\n");
 188 }
 189
 190
 191 /* Dump into STDERR all the data references from DATAREFS.  */
 192
 193 DEBUG_FUNCTION void
 194 debug_data_references (vec<data_reference_p> datarefs)
 195 {
 196   dump_data_references (stderr, datarefs);
 197 }
 198
 199 /* Print to STDERR the data_reference DR.  */
 200
 201 DEBUG_FUNCTION void
 202 debug_data_reference (struct data_reference *dr)
 203 {
 204   dump_data_reference (stderr, dr);
 205 }
 206
 207 /* Dump function for a DATA_REFERENCE structure.  */
 208
 209 void
 210 dump_data_reference (FILE *outf,
 211                      struct data_reference *dr)
 212 {
 213   unsigned int i;
 214
 215   fprintf (outf, "#(Data Ref: \n");
 216   fprintf (outf, "#  bb: %d \n", gimple_bb (DR_STMT (dr))->index);
 217   fprintf (outf, "#  stmt: ");
 218   print_gimple_stmt (outf, DR_STMT (dr), 0, 0);
 219   fprintf (outf, "#  ref: ");
 220   print_generic_stmt (outf, DR_REF (dr), 0);
 221   fprintf (outf, "#  base_object: ");
 222   print_generic_stmt (outf, DR_BASE_OBJECT (dr), 0);
 223
 224   for (i = 0; i < DR_NUM_DIMENSIONS (dr); i++)
 225     {
 226       fprintf (outf, "#  Access function %d: ", i);
 227       print_generic_stmt (outf, DR_ACCESS_FN (dr, i), 0);
 228     }
 229   fprintf (outf, "#)\n");
 230 }
 231
 232 /* Unified dump function for a DATA_REFERENCE structure.  */
 233
 234 DEBUG_FUNCTION void
 235 debug (data_reference &ref)
 236 {
 237   dump_data_reference (stderr, &ref);
 238 }
 239
 240 DEBUG_FUNCTION void
 241 debug (data_reference *ptr)
 242 {
 243   if (ptr)
 244     debug (*ptr);
 245   else
 246     fprintf (stderr, "<nil>\n");
 247 }
 248
 249
 250 /* Dumps the affine function described by FN to the file OUTF.  */
 251
 252 DEBUG_FUNCTION void
 253 dump_affine_function (FILE *outf, affine_fn fn)
 254 {
 255   unsigned i;
 256   tree coef;
 257
 258   print_generic_expr (outf, fn[0], TDF_SLIM);
 259   for (i = 1; fn.iterate (i, &coef); i++)
 260     {
 261       fprintf (outf, " + ");
 262       print_generic_expr (outf, coef, TDF_SLIM);
 263       fprintf (outf, " * x_%u", i);
 264     }
 265 }
 266
 267 /* Dumps the conflict function CF to the file OUTF.  */
 268
 269 DEBUG_FUNCTION void
 270 dump_conflict_function (FILE *outf, conflict_function *cf)
 271 {
 272   unsigned i;
 273
 274   if (cf->n == NO_DEPENDENCE)
 275     fprintf (outf, "no dependence");
 276   else if (cf->n == NOT_KNOWN)
 277     fprintf (outf, "not known");
 278   else
 279     {
 280       for (i = 0; i < cf->n; i++)
 281         {
 282           if (i != 0)
 283             fprintf (outf, " ");
 284           fprintf (outf, "[");
 285           dump_affine_function (outf, cf->fns[i]);
 286           fprintf (outf, "]");
 287         }
 288     }
 289 }
 290
 291 /* Dump function for a SUBSCRIPT structure.  */
 292
 293 DEBUG_FUNCTION void
 294 dump_subscript (FILE *outf, struct subscript *subscript)
 295 {
 296   conflict_function *cf = SUB_CONFLICTS_IN_A (subscript);
 297
 298   fprintf (outf, "\n (subscript \n");
 299   fprintf (outf, "  iterations_that_access_an_element_twice_in_A: ");
 300   dump_conflict_function (outf, cf);
 301   if (CF_NONTRIVIAL_P (cf))
 302     {
 303       tree last_iteration = SUB_LAST_CONFLICT (subscript);
 304       fprintf (outf, "\n  last_conflict: ");
 305       print_generic_expr (outf, last_iteration, 0);
 306     }
 307
 308   cf = SUB_CONFLICTS_IN_B (subscript);
 309   fprintf (outf, "\n  iterations_that_access_an_element_twice_in_B: ");
 310   dump_conflict_function (outf, cf);
 311   if (CF_NONTRIVIAL_P (cf))
 312     {
 313       tree last_iteration = SUB_LAST_CONFLICT (subscript);
 314       fprintf (outf, "\n  last_conflict: ");
 315       print_generic_expr (outf, last_iteration, 0);
 316     }
 317
 318   fprintf (outf, "\n  (Subscript distance: ");
 319   print_generic_expr (outf, SUB_DISTANCE (subscript), 0);
 320   fprintf (outf, " ))\n");
 321 }
 322
 323 /* Print the classic direction vector DIRV to OUTF.  */
 324
 325 DEBUG_FUNCTION void
 326 print_direction_vector (FILE *outf,
 327                         lambda_vector dirv,
 328                         int length)
 329 {
 330   int eq;
 331
 332   for (eq = 0; eq < length; eq++)
 333     {
 334       enum data_dependence_direction dir = ((enum data_dependence_direction)
 335                                             dirv[eq]);
 336
 337       switch (dir)
 338         {
 339         case dir_positive:
 340           fprintf (outf, "    +");
 341           break;
 342         case dir_negative:
 343           fprintf (outf, "    -");
 344           break;
 345         case dir_equal:
 346           fprintf (outf, "    =");
 347           break;
 348         case dir_positive_or_equal:
 349           fprintf (outf, "   +=");
 350           break;
 351         case dir_positive_or_negative:
 352           fprintf (outf, "   +-");
 353           break;
 354         case dir_negative_or_equal:
 355           fprintf (outf, "   -=");
 356           break;
 357         case dir_star:
 358           fprintf (outf, "    *");
 359           break;
 360         default:
 361           fprintf (outf, "indep");
 362           break;
 363         }
 364     }
 365   fprintf (outf, "\n");
 366 }
 367
 368 /* Print a vector of direction vectors.  */
 369
 370 DEBUG_FUNCTION void
 371 print_dir_vectors (FILE *outf, vec<lambda_vector> dir_vects,
 372                    int length)
 373 {
 374   unsigned j;
 375   lambda_vector v;
 376
 377   FOR_EACH_VEC_ELT (dir_vects, j, v)
 378     print_direction_vector (outf, v, length);
 379 }
 380
 381 /* Print out a vector VEC of length N to OUTFILE.  */
 382
 383 DEBUG_FUNCTION void
 384 print_lambda_vector (FILE * outfile, lambda_vector vector, int n)
 385 {
 386   int i;
 387
 388   for (i = 0; i < n; i++)
 389     fprintf (outfile, "%3d ", vector[i]);
 390   fprintf (outfile, "\n");
 391 }
 392
 393 /* Print a vector of distance vectors.  */
 394
 395 DEBUG_FUNCTION void
 396 print_dist_vectors (FILE *outf, vec<lambda_vector> dist_vects,
 397                     int length)
 398 {
 399   unsigned j;
 400   lambda_vector v;
 401
 402   FOR_EACH_VEC_ELT (dist_vects, j, v)
 403     print_lambda_vector (outf, v, length);
 404 }
 405
 406 /* Dump function for a DATA_DEPENDENCE_RELATION structure.  */
 407
 408 DEBUG_FUNCTION void
 409 dump_data_dependence_relation (FILE *outf,
 410                                struct data_dependence_relation *ddr)
 411 {
 412   struct data_reference *dra, *drb;
 413
 414   fprintf (outf, "(Data Dep: \n");
 415
 416   if (!ddr || DDR_ARE_DEPENDENT (ddr) == chrec_dont_know)
 417     {
 418       if (ddr)
 419         {
 420           dra = DDR_A (ddr);
 421           drb = DDR_B (ddr);
 422           if (dra)
 423             dump_data_reference (outf, dra);
 424           else
 425             fprintf (outf, "    (nil)\n");
 426           if (drb)
 427             dump_data_reference (outf, drb);
 428           else
 429             fprintf (outf, "    (nil)\n");
 430         }
 431       fprintf (outf, "    (don't know)\n)\n");
 432       return;
 433     }
 434
 435   dra = DDR_A (ddr);
 436   drb = DDR_B (ddr);
 437   dump_data_reference (outf, dra);
 438   dump_data_reference (outf, drb);
 439
 440   if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
 441     fprintf (outf, "    (no dependence)\n");
 442
 443   else if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
 444     {
 445       unsigned int i;
 446       struct loop *loopi;
 447
 448       for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
 449         {
 450           fprintf (outf, "  access_fn_A: ");
 451           print_generic_stmt (outf, DR_ACCESS_FN (dra, i), 0);
 452           fprintf (outf, "  access_fn_B: ");
 453           print_generic_stmt (outf, DR_ACCESS_FN (drb, i), 0);
 454           dump_subscript (outf, DDR_SUBSCRIPT (ddr, i));
 455         }
 456
 457       fprintf (outf, "  inner loop index: %d\n", DDR_INNER_LOOP (ddr));
 458       fprintf (outf, "  loop nest: (");
 459       FOR_EACH_VEC_ELT (DDR_LOOP_NEST (ddr), i, loopi)
 460         fprintf (outf, "%d ", loopi->num);
 461       fprintf (outf, ")\n");
 462
 463       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
 464         {
 465           fprintf (outf, "  distance_vector: ");
 466           print_lambda_vector (outf, DDR_DIST_VECT (ddr, i),
 467                                DDR_NB_LOOPS (ddr));
 468         }
 469
 470       for (i = 0; i < DDR_NUM_DIR_VECTS (ddr); i++)
 471         {
 472           fprintf (outf, "  direction_vector: ");
 473           print_direction_vector (outf, DDR_DIR_VECT (ddr, i),
 474                                   DDR_NB_LOOPS (ddr));
 475         }
 476     }
 477
 478   fprintf (outf, ")\n");
 479 }
 480
 481 /* Debug version.  */
 482
 483 DEBUG_FUNCTION void
 484 debug_data_dependence_relation (struct data_dependence_relation *ddr)
 485 {
 486   dump_data_dependence_relation (stderr, ddr);
 487 }
 488
 489 /* Dump into FILE all the dependence relations from DDRS.  */
 490
 491 DEBUG_FUNCTION void
 492 dump_data_dependence_relations (FILE *file,
 493                                 vec<ddr_p> ddrs)
 494 {
 495   unsigned int i;
 496   struct data_dependence_relation *ddr;
 497
 498   FOR_EACH_VEC_ELT (ddrs, i, ddr)
 499     dump_data_dependence_relation (file, ddr);
 500 }
 501
 502 DEBUG_FUNCTION void
 503 debug (vec<ddr_p> &ref)
 504 {
 505   dump_data_dependence_relations (stderr, ref);
 506 }
 507
 508 DEBUG_FUNCTION void
 509 debug (vec<ddr_p> *ptr)
 510 {
 511   if (ptr)
 512     debug (*ptr);
 513   else
 514     fprintf (stderr, "<nil>\n");
 515 }
 516
 517
 518 /* Dump to STDERR all the dependence relations from DDRS.  */
 519
 520 DEBUG_FUNCTION void
 521 debug_data_dependence_relations (vec<ddr_p> ddrs)
 522 {
 523   dump_data_dependence_relations (stderr, ddrs);
 524 }
 525
 526 /* Dumps the distance and direction vectors in FILE.  DDRS contains
 527    the dependence relations, and VECT_SIZE is the size of the
 528    dependence vectors, or in other words the number of loops in the
 529    considered nest.  */
 530
 531 DEBUG_FUNCTION void
 532 dump_dist_dir_vectors (FILE *file, vec<ddr_p> ddrs)
 533 {
 534   unsigned int i, j;
 535   struct data_dependence_relation *ddr;
 536   lambda_vector v;
 537
 538   FOR_EACH_VEC_ELT (ddrs, i, ddr)
 539     if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE && DDR_AFFINE_P (ddr))
 540       {
 541         FOR_EACH_VEC_ELT (DDR_DIST_VECTS (ddr), j, v)
 542           {
 543             fprintf (file, "DISTANCE_V (");
 544             print_lambda_vector (file, v, DDR_NB_LOOPS (ddr));
 545             fprintf (file, ")\n");
 546           }
 547
 548         FOR_EACH_VEC_ELT (DDR_DIR_VECTS (ddr), j, v)
 549           {
 550             fprintf (file, "DIRECTION_V (");
 551             print_direction_vector (file, v, DDR_NB_LOOPS (ddr));
 552             fprintf (file, ")\n");
 553           }
 554       }
 555
 556   fprintf (file, "\n\n");
 557 }
 558
 559 /* Dumps the data dependence relations DDRS in FILE.  */
 560
 561 DEBUG_FUNCTION void
 562 dump_ddrs (FILE *file, vec<ddr_p> ddrs)
 563 {
 564   unsigned int i;
 565   struct data_dependence_relation *ddr;
 566
 567   FOR_EACH_VEC_ELT (ddrs, i, ddr)
 568     dump_data_dependence_relation (file, ddr);
 569
 570   fprintf (file, "\n\n");
 571 }
 572
 573 DEBUG_FUNCTION void
 574 debug_ddrs (vec<ddr_p> ddrs)
 575 {
 576   dump_ddrs (stderr, ddrs);
 577 }
 578
 579 /* Helper function for split_constant_offset.  Expresses OP0 CODE OP1
 580    (the type of the result is TYPE) as VAR + OFF, where OFF is a nonzero
 581    constant of type ssizetype, and returns true.  If we cannot do this
 582    with OFF nonzero, OFF and VAR are set to NULL_TREE instead and false
 583    is returned.  */
 584
 585 static bool
 586 split_constant_offset_1 (tree type, tree op0, enum tree_code code, tree op1,
 587                          tree *var, tree *off)
 588 {
 589   tree var0, var1;
 590   tree off0, off1;
 591   enum tree_code ocode = code;
 592
 593   *var = NULL_TREE;
 594   *off = NULL_TREE;
 595
 596   switch (code)
 597     {
 598     case INTEGER_CST:
 599       *var = build_int_cst (type, 0);
 600       *off = fold_convert (ssizetype, op0);
 601       return true;
 602
 603     case POINTER_PLUS_EXPR:
 604       ocode = PLUS_EXPR;
 605       /* FALLTHROUGH */
 606     case PLUS_EXPR:
 607     case MINUS_EXPR:
 608       split_constant_offset (op0, &var0, &off0);
 609       split_constant_offset (op1, &var1, &off1);
 610       *var = fold_build2 (code, type, var0, var1);
 611       *off = size_binop (ocode, off0, off1);
 612       return true;
 613
 614     case MULT_EXPR:
 615       if (TREE_CODE (op1) != INTEGER_CST)
 616         return false;
 617
 618       split_constant_offset (op0, &var0, &off0);
 619       *var = fold_build2 (MULT_EXPR, type, var0, op1);
 620       *off = size_binop (MULT_EXPR, off0, fold_convert (ssizetype, op1));
 621       return true;
 622
 623     case ADDR_EXPR:
 624       {
 625         tree base, poffset;
 626         HOST_WIDE_INT pbitsize, pbitpos;
 627         machine_mode pmode;
 628         int punsignedp, pvolatilep;
 629
 630         op0 = TREE_OPERAND (op0, 0);
 631         base = get_inner_reference (op0, &pbitsize, &pbitpos, &poffset,
 632                                     &pmode, &punsignedp, &pvolatilep, false);
 633
 634         if (pbitpos % BITS_PER_UNIT != 0)
 635           return false;
 636         base = build_fold_addr_expr (base);
 637         off0 = ssize_int (pbitpos / BITS_PER_UNIT);
 638
 639         if (poffset)
 640           {
 641             split_constant_offset (poffset, &poffset, &off1);
 642             off0 = size_binop (PLUS_EXPR, off0, off1);
 643             if (POINTER_TYPE_P (TREE_TYPE (base)))
 644               base = fold_build_pointer_plus (base, poffset);
 645             else
 646               base = fold_build2 (PLUS_EXPR, TREE_TYPE (base), base,
 647                                   fold_convert (TREE_TYPE (base), poffset));
 648           }
 649
 650         var0 = fold_convert (type, base);
 651
 652         /* If variable length types are involved, punt, otherwise casts
 653            might be converted into ARRAY_REFs in gimplify_conversion.
 654            To compute that ARRAY_REF's element size TYPE_SIZE_UNIT, which
 655            possibly no longer appears in current GIMPLE, might resurface.
 656            This perhaps could run
 657            if (CONVERT_EXPR_P (var0))
 658              {
 659                gimplify_conversion (&var0);
 660                // Attempt to fill in any within var0 found ARRAY_REF's
 661                // element size from corresponding op embedded ARRAY_REF,
 662                // if unsuccessful, just punt.
 663              }  */
 664         while (POINTER_TYPE_P (type))
 665           type = TREE_TYPE (type);
 666         if (int_size_in_bytes (type) < 0)
 667           return false;
 668
 669         *var = var0;
 670         *off = off0;
 671         return true;
 672       }
 673
 674     case SSA_NAME:
 675       {
 676         if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (op0))
 677           return false;
 678
 679         gimple def_stmt = SSA_NAME_DEF_STMT (op0);
 680         enum tree_code subcode;
 681
 682         if (gimple_code (def_stmt) != GIMPLE_ASSIGN)
 683           return false;
 684
 685         var0 = gimple_assign_rhs1 (def_stmt);
 686         subcode = gimple_assign_rhs_code (def_stmt);
 687         var1 = gimple_assign_rhs2 (def_stmt);
 688
 689         return split_constant_offset_1 (type, var0, subcode, var1, var, off);
 690       }
 691     CASE_CONVERT:
 692       {
 693         /* We must not introduce undefined overflow, and we must not change the value.
 694            Hence we're okay if the inner type doesn't overflow to start with
 695            (pointer or signed), the outer type also is an integer or pointer
 696            and the outer precision is at least as large as the inner.  */
 697         tree itype = TREE_TYPE (op0);
 698         if ((POINTER_TYPE_P (itype)
 699              || (INTEGRAL_TYPE_P (itype) && TYPE_OVERFLOW_UNDEFINED (itype)))
 700             && TYPE_PRECISION (type) >= TYPE_PRECISION (itype)
 701             && (POINTER_TYPE_P (type) || INTEGRAL_TYPE_P (type)))
 702           {
 703             split_constant_offset (op0, &var0, off);
 704             *var = fold_convert (type, var0);
 705             return true;
 706           }
 707         return false;
 708       }
 709
 710     default:
 711       return false;
 712     }
 713 }
 714
 715 /* Expresses EXP as VAR + OFF, where off is a constant.  The type of OFF
 716    will be ssizetype.  */
 717
 718 void
 719 split_constant_offset (tree exp, tree *var, tree *off)
 720 {
 721   tree type = TREE_TYPE (exp), otype, op0, op1, e, o;
 722   enum tree_code code;
 723
 724   *var = exp;
 725   *off = ssize_int (0);
 726   STRIP_NOPS (exp);
 727
 728   if (tree_is_chrec (exp)
 729       || get_gimple_rhs_class (TREE_CODE (exp)) == GIMPLE_TERNARY_RHS)
 730     return;
 731
 732   otype = TREE_TYPE (exp);
 733   code = TREE_CODE (exp);
 734   extract_ops_from_tree (exp, &code, &op0, &op1);
 735   if (split_constant_offset_1 (otype, op0, code, op1, &e, &o))
 736     {
 737       *var = fold_convert (type, e);
 738       *off = o;
 739     }
 740 }
 741
 742 /* Returns the address ADDR of an object in a canonical shape (without nop
 743    casts, and with type of pointer to the object).  */
 744
 745 static tree
 746 canonicalize_base_object_address (tree addr)
 747 {
 748   tree orig = addr;
 749
 750   STRIP_NOPS (addr);
 751
 752   /* The base address may be obtained by casting from integer, in that case
 753      keep the cast.  */
 754   if (!POINTER_TYPE_P (TREE_TYPE (addr)))
 755     return orig;
 756
 757   if (TREE_CODE (addr) != ADDR_EXPR)
 758     return addr;
 759
 760   return build_fold_addr_expr (TREE_OPERAND (addr, 0));
 761 }
 762
 763 /* Analyzes the behavior of the memory reference DR in the innermost loop or
 764    basic block that contains it.  Returns true if analysis succeed or false
 765    otherwise.  */
 766
 767 bool
 768 dr_analyze_innermost (struct data_reference *dr, struct loop *nest)
 769 {
 770   gimple stmt = DR_STMT (dr);
 771   struct loop *loop = loop_containing_stmt (stmt);
 772   tree ref = DR_REF (dr);
 773   HOST_WIDE_INT pbitsize, pbitpos;
 774   tree base, poffset;
 775   machine_mode pmode;
 776   int punsignedp, pvolatilep;
 777   affine_iv base_iv, offset_iv;
 778   tree init, dinit, step;
 779   bool in_loop = (loop && loop->num);
 780
 781   if (dump_file && (dump_flags & TDF_DETAILS))
 782     fprintf (dump_file, "analyze_innermost: ");
 783
 784   base = get_inner_reference (ref, &pbitsize, &pbitpos, &poffset,
 785                               &pmode, &punsignedp, &pvolatilep, false);
 786   gcc_assert (base != NULL_TREE);
 787
 788   if (pbitpos % BITS_PER_UNIT != 0)
 789     {
 790       if (dump_file && (dump_flags & TDF_DETAILS))
 791         fprintf (dump_file, "failed: bit offset alignment.\n");
 792       return false;
 793     }
 794
 795   if (TREE_CODE (base) == MEM_REF)
 796     {
 797       if (!integer_zerop (TREE_OPERAND (base, 1)))
 798         {
 799           offset_int moff = mem_ref_offset (base);
 800           tree mofft = wide_int_to_tree (sizetype, moff);
 801           if (!poffset)
 802             poffset = mofft;
 803           else
 804             poffset = size_binop (PLUS_EXPR, poffset, mofft);
 805         }
 806       base = TREE_OPERAND (base, 0);
 807     }
 808   else
 809     base = build_fold_addr_expr (base);
 810
 811   if (in_loop)
 812     {
 813       if (!simple_iv (loop, loop_containing_stmt (stmt), base, &base_iv,
 814                       nest ? true : false))
 815         {
 816           if (nest)
 817             {
 818               if (dump_file && (dump_flags & TDF_DETAILS))
 819                 fprintf (dump_file, "failed: evolution of base is not"
 820                                     " affine.\n");
 821               return false;
 822             }
 823           else
 824             {
 825               base_iv.base = base;
 826               base_iv.step = ssize_int (0);
 827               base_iv.no_overflow = true;
 828             }
 829         }
 830     }
 831   else
 832     {
 833       base_iv.base = base;
 834       base_iv.step = ssize_int (0);
 835       base_iv.no_overflow = true;
 836     }
 837
 838   if (!poffset)
 839     {
 840       offset_iv.base = ssize_int (0);
 841       offset_iv.step = ssize_int (0);
 842     }
 843   else
 844     {
 845       if (!in_loop)
 846         {
 847           offset_iv.base = poffset;
 848           offset_iv.step = ssize_int (0);
 849         }
 850       else if (!simple_iv (loop, loop_containing_stmt (stmt),
 851                            poffset, &offset_iv,
 852                            nest ? true : false))
 853         {
 854           if (nest)
 855             {
 856               if (dump_file && (dump_flags & TDF_DETAILS))
 857                 fprintf (dump_file, "failed: evolution of offset is not"
 858                                     " affine.\n");
 859               return false;
 860             }
 861           else
 862             {
 863               offset_iv.base = poffset;
 864               offset_iv.step = ssize_int (0);
 865             }
 866         }
 867     }
 868
 869   init = ssize_int (pbitpos / BITS_PER_UNIT);
 870   split_constant_offset (base_iv.base, &base_iv.base, &dinit);
 871   init =  size_binop (PLUS_EXPR, init, dinit);
 872   split_constant_offset (offset_iv.base, &offset_iv.base, &dinit);
 873   init =  size_binop (PLUS_EXPR, init, dinit);
 874
 875   step = size_binop (PLUS_EXPR,
 876                      fold_convert (ssizetype, base_iv.step),
 877                      fold_convert (ssizetype, offset_iv.step));
 878
 879   DR_BASE_ADDRESS (dr) = canonicalize_base_object_address (base_iv.base);
 880
 881   DR_OFFSET (dr) = fold_convert (ssizetype, offset_iv.base);
 882   DR_INIT (dr) = init;
 883   DR_STEP (dr) = step;
 884
 885   DR_ALIGNED_TO (dr) = size_int (highest_pow2_factor (offset_iv.base));
 886
 887   if (dump_file && (dump_flags & TDF_DETAILS))
 888     fprintf (dump_file, "success.\n");
 889
 890   return true;
 891 }
 892
 893 /* Determines the base object and the list of indices of memory reference
 894    DR, analyzed in LOOP and instantiated in loop nest NEST.  */
 895
 896 static void
 897 dr_analyze_indices (struct data_reference *dr, loop_p nest, loop_p loop)
 898 {
 899   vec<tree> access_fns = vNULL;
 900   tree ref, op;
 901   tree base, off, access_fn;
 902   basic_block before_loop;
 903
 904   /* If analyzing a basic-block there are no indices to analyze
 905      and thus no access functions.  */
 906   if (!nest)
 907     {
 908       DR_BASE_OBJECT (dr) = DR_REF (dr);
 909       DR_ACCESS_FNS (dr).create (0);
 910       return;
 911     }
 912
 913   ref = DR_REF (dr);
 914   before_loop = block_before_loop (nest);
 915
 916   /* REALPART_EXPR and IMAGPART_EXPR can be handled like accesses
 917      into a two element array with a constant index.  The base is
 918      then just the immediate underlying object.  */
 919   if (TREE_CODE (ref) == REALPART_EXPR)
 920     {
 921       ref = TREE_OPERAND (ref, 0);
 922       access_fns.safe_push (integer_zero_node);
 923     }
 924   else if (TREE_CODE (ref) == IMAGPART_EXPR)
 925     {
 926       ref = TREE_OPERAND (ref, 0);
 927       access_fns.safe_push (integer_one_node);
 928     }
 929
 930   /* Analyze access functions of dimensions we know to be independent.  */
 931   while (handled_component_p (ref))
 932     {
 933       if (TREE_CODE (ref) == ARRAY_REF)
 934         {
 935           op = TREE_OPERAND (ref, 1);
 936           access_fn = analyze_scalar_evolution (loop, op);
 937           access_fn = instantiate_scev (before_loop, loop, access_fn);
 938           access_fns.safe_push (access_fn);
 939         }
 940       else if (TREE_CODE (ref) == COMPONENT_REF
 941                && TREE_CODE (TREE_TYPE (TREE_OPERAND (ref, 0))) == RECORD_TYPE)
 942         {
 943           /* For COMPONENT_REFs of records (but not unions!) use the
 944              FIELD_DECL offset as constant access function so we can
 945              disambiguate a[i].f1 and a[i].f2.  */
 946           tree off = component_ref_field_offset (ref);
 947           off = size_binop (PLUS_EXPR,
 948                             size_binop (MULT_EXPR,
 949                                         fold_convert (bitsizetype, off),
 950                                         bitsize_int (BITS_PER_UNIT)),
 951                             DECL_FIELD_BIT_OFFSET (TREE_OPERAND (ref, 1)));
 952           access_fns.safe_push (off);
 953         }
 954       else
 955         /* If we have an unhandled component we could not translate
 956            to an access function stop analyzing.  We have determined
 957            our base object in this case.  */
 958         break;
 959
 960       ref = TREE_OPERAND (ref, 0);
 961     }
 962
 963   /* If the address operand of a MEM_REF base has an evolution in the
 964      analyzed nest, add it as an additional independent access-function.  */
 965   if (TREE_CODE (ref) == MEM_REF)
 966     {
 967       op = TREE_OPERAND (ref, 0);
 968       access_fn = analyze_scalar_evolution (loop, op);
 969       access_fn = instantiate_scev (before_loop, loop, access_fn);
 970       if (TREE_CODE (access_fn) == POLYNOMIAL_CHREC)
 971         {
 972           tree orig_type;
 973           tree memoff = TREE_OPERAND (ref, 1);
 974           base = initial_condition (access_fn);
 975           orig_type = TREE_TYPE (base);
 976           STRIP_USELESS_TYPE_CONVERSION (base);
 977           split_constant_offset (base, &base, &off);
 978           STRIP_USELESS_TYPE_CONVERSION (base);
 979           /* Fold the MEM_REF offset into the evolutions initial
 980              value to make more bases comparable.  */
 981           if (!integer_zerop (memoff))
 982             {
 983               off = size_binop (PLUS_EXPR, off,
 984                                 fold_convert (ssizetype, memoff));
 985               memoff = build_int_cst (TREE_TYPE (memoff), 0);
 986             }
 987           /* Adjust the offset so it is a multiple of the access type
 988              size and thus we separate bases that can possibly be used
 989              to produce partial overlaps (which the access_fn machinery
 990              cannot handle).  */
 991           wide_int rem;
 992           if (TYPE_SIZE_UNIT (TREE_TYPE (ref))
 993               && TREE_CODE (TYPE_SIZE_UNIT (TREE_TYPE (ref))) == INTEGER_CST
 994               && !integer_zerop (TYPE_SIZE_UNIT (TREE_TYPE (ref))))
 995             rem = wi::mod_trunc (off, TYPE_SIZE_UNIT (TREE_TYPE (ref)), SIGNED);
 996           else
 997             /* If we can't compute the remainder simply force the initial
 998                condition to zero.  */
 999             rem = off;
1000           off = wide_int_to_tree (ssizetype, wi::sub (off, rem));
1001           memoff = wide_int_to_tree (TREE_TYPE (memoff), rem);
1002           /* And finally replace the initial condition.  */
1003           access_fn = chrec_replace_initial_condition
1004               (access_fn, fold_convert (orig_type, off));
1005           /* ???  This is still not a suitable base object for
1006              dr_may_alias_p - the base object needs to be an
1007              access that covers the object as whole.  With
1008              an evolution in the pointer this cannot be
1009              guaranteed.
1010              As a band-aid, mark the access so we can special-case
1011              it in dr_may_alias_p.  */
1012           tree old = ref;
1013           ref = fold_build2_loc (EXPR_LOCATION (ref),
1014                                  MEM_REF, TREE_TYPE (ref),
1015                                  base, memoff);
1016           MR_DEPENDENCE_CLIQUE (ref) = MR_DEPENDENCE_CLIQUE (old);
1017           MR_DEPENDENCE_BASE (ref) = MR_DEPENDENCE_BASE (old);
1018           DR_UNCONSTRAINED_BASE (dr) = true;
1019           access_fns.safe_push (access_fn);
1020         }
1021     }
1022   else if (DECL_P (ref))
1023     {
1024       /* Canonicalize DR_BASE_OBJECT to MEM_REF form.  */
1025       ref = build2 (MEM_REF, TREE_TYPE (ref),
1026                     build_fold_addr_expr (ref),
1027                     build_int_cst (reference_alias_ptr_type (ref), 0));
1028     }
1029
1030   DR_BASE_OBJECT (dr) = ref;
1031   DR_ACCESS_FNS (dr) = access_fns;
1032 }
1033
1034 /* Extracts the alias analysis information from the memory reference DR.  */
1035
1036 static void
1037 dr_analyze_alias (struct data_reference *dr)
1038 {
1039   tree ref = DR_REF (dr);
1040   tree base = get_base_address (ref), addr;
1041
1042   if (INDIRECT_REF_P (base)
1043       || TREE_CODE (base) == MEM_REF)
1044     {
1045       addr = TREE_OPERAND (base, 0);
1046       if (TREE_CODE (addr) == SSA_NAME)
1047         DR_PTR_INFO (dr) = SSA_NAME_PTR_INFO (addr);
1048     }
1049 }
1050
1051 /* Frees data reference DR.  */
1052
1053 void
1054 free_data_ref (data_reference_p dr)
1055 {
1056   DR_ACCESS_FNS (dr).release ();
1057   free (dr);
1058 }
1059
1060 /* Analyzes memory reference MEMREF accessed in STMT.  The reference
1061    is read if IS_READ is true, write otherwise.  Returns the
1062    data_reference description of MEMREF.  NEST is the outermost loop
1063    in which the reference should be instantiated, LOOP is the loop in
1064    which the data reference should be analyzed.  */
1065
1066 struct data_reference *
1067 create_data_ref (loop_p nest, loop_p loop, tree memref, gimple stmt,
1068                  bool is_read)
1069 {
1070   struct data_reference *dr;
1071
1072   if (dump_file && (dump_flags & TDF_DETAILS))
1073     {
1074       fprintf (dump_file, "Creating dr for ");
1075       print_generic_expr (dump_file, memref, TDF_SLIM);
1076       fprintf (dump_file, "\n");
1077     }
1078
1079   dr = XCNEW (struct data_reference);
1080   DR_STMT (dr) = stmt;
1081   DR_REF (dr) = memref;
1082   DR_IS_READ (dr) = is_read;
1083
1084   dr_analyze_innermost (dr, nest);
1085   dr_analyze_indices (dr, nest, loop);
1086   dr_analyze_alias (dr);
1087
1088   if (dump_file && (dump_flags & TDF_DETAILS))
1089     {
1090       unsigned i;
1091       fprintf (dump_file, "\tbase_address: ");
1092       print_generic_expr (dump_file, DR_BASE_ADDRESS (dr), TDF_SLIM);
1093       fprintf (dump_file, "\n\toffset from base address: ");
1094       print_generic_expr (dump_file, DR_OFFSET (dr), TDF_SLIM);
1095       fprintf (dump_file, "\n\tconstant offset from base address: ");
1096       print_generic_expr (dump_file, DR_INIT (dr), TDF_SLIM);
1097       fprintf (dump_file, "\n\tstep: ");
1098       print_generic_expr (dump_file, DR_STEP (dr), TDF_SLIM);
1099       fprintf (dump_file, "\n\taligned to: ");
1100       print_generic_expr (dump_file, DR_ALIGNED_TO (dr), TDF_SLIM);
1101       fprintf (dump_file, "\n\tbase_object: ");
1102       print_generic_expr (dump_file, DR_BASE_OBJECT (dr), TDF_SLIM);
1103       fprintf (dump_file, "\n");
1104       for (i = 0; i < DR_NUM_DIMENSIONS (dr); i++)
1105         {
1106           fprintf (dump_file, "\tAccess function %d: ", i);
1107           print_generic_stmt (dump_file, DR_ACCESS_FN (dr, i), TDF_SLIM);
1108         }
1109     }
1110
1111   return dr;
1112 }
1113
1114 /* Check if OFFSET1 and OFFSET2 (DR_OFFSETs of some data-refs) are identical
1115    expressions.  */
1116 static bool
1117 dr_equal_offsets_p1 (tree offset1, tree offset2)
1118 {
1119   bool res;
1120
1121   STRIP_NOPS (offset1);
1122   STRIP_NOPS (offset2);
1123
1124   if (offset1 == offset2)
1125     return true;
1126
1127   if (TREE_CODE (offset1) != TREE_CODE (offset2)
1128       || (!BINARY_CLASS_P (offset1) && !UNARY_CLASS_P (offset1)))
1129     return false;
1130
1131   res = dr_equal_offsets_p1 (TREE_OPERAND (offset1, 0),
1132                              TREE_OPERAND (offset2, 0));
1133
1134   if (!res || !BINARY_CLASS_P (offset1))
1135     return res;
1136
1137   res = dr_equal_offsets_p1 (TREE_OPERAND (offset1, 1),
1138                              TREE_OPERAND (offset2, 1));
1139
1140   return res;
1141 }
1142
1143 /* Check if DRA and DRB have equal offsets.  */
1144 bool
1145 dr_equal_offsets_p (struct data_reference *dra,
1146                     struct data_reference *drb)
1147 {
1148   tree offset1, offset2;
1149
1150   offset1 = DR_OFFSET (dra);
1151   offset2 = DR_OFFSET (drb);
1152
1153   return dr_equal_offsets_p1 (offset1, offset2);
1154 }
1155
1156 /* Returns true if FNA == FNB.  */
1157
1158 static bool
1159 affine_function_equal_p (affine_fn fna, affine_fn fnb)
1160 {
1161   unsigned i, n = fna.length ();
1162
1163   if (n != fnb.length ())
1164     return false;
1165
1166   for (i = 0; i < n; i++)
1167     if (!operand_equal_p (fna[i], fnb[i], 0))
1168       return false;
1169
1170   return true;
1171 }
1172
1173 /* If all the functions in CF are the same, returns one of them,
1174    otherwise returns NULL.  */
1175
1176 static affine_fn
1177 common_affine_function (conflict_function *cf)
1178 {
1179   unsigned i;
1180   affine_fn comm;
1181
1182   if (!CF_NONTRIVIAL_P (cf))
1183     return affine_fn ();
1184
1185   comm = cf->fns[0];
1186
1187   for (i = 1; i < cf->n; i++)
1188     if (!affine_function_equal_p (comm, cf->fns[i]))
1189       return affine_fn ();
1190
1191   return comm;
1192 }
1193
1194 /* Returns the base of the affine function FN.  */
1195
1196 static tree
1197 affine_function_base (affine_fn fn)
1198 {
1199   return fn[0];
1200 }
1201
1202 /* Returns true if FN is a constant.  */
1203
1204 static bool
1205 affine_function_constant_p (affine_fn fn)
1206 {
1207   unsigned i;
1208   tree coef;
1209
1210   for (i = 1; fn.iterate (i, &coef); i++)
1211     if (!integer_zerop (coef))
1212       return false;
1213
1214   return true;
1215 }
1216
1217 /* Returns true if FN is the zero constant function.  */
1218
1219 static bool
1220 affine_function_zero_p (affine_fn fn)
1221 {
1222   return (integer_zerop (affine_function_base (fn))
1223           && affine_function_constant_p (fn));
1224 }
1225
1226 /* Returns a signed integer type with the largest precision from TA
1227    and TB.  */
1228
1229 static tree
1230 signed_type_for_types (tree ta, tree tb)
1231 {
1232   if (TYPE_PRECISION (ta) > TYPE_PRECISION (tb))
1233     return signed_type_for (ta);
1234   else
1235     return signed_type_for (tb);
1236 }
1237
1238 /* Applies operation OP on affine functions FNA and FNB, and returns the
1239    result.  */
1240
1241 static affine_fn
1242 affine_fn_op (enum tree_code op, affine_fn fna, affine_fn fnb)
1243 {
1244   unsigned i, n, m;
1245   affine_fn ret;
1246   tree coef;
1247
1248   if (fnb.length () > fna.length ())
1249     {
1250       n = fna.length ();
1251       m = fnb.length ();
1252     }
1253   else
1254     {
1255       n = fnb.length ();
1256       m = fna.length ();
1257     }
1258
1259   ret.create (m);
1260   for (i = 0; i < n; i++)
1261     {
1262       tree type = signed_type_for_types (TREE_TYPE (fna[i]),
1263                                          TREE_TYPE (fnb[i]));
1264       ret.quick_push (fold_build2 (op, type, fna[i], fnb[i]));
1265     }
1266
1267   for (; fna.iterate (i, &coef); i++)
1268     ret.quick_push (fold_build2 (op, signed_type_for (TREE_TYPE (coef)),
1269                                  coef, integer_zero_node));
1270   for (; fnb.iterate (i, &coef); i++)
1271     ret.quick_push (fold_build2 (op, signed_type_for (TREE_TYPE (coef)),
1272                                  integer_zero_node, coef));
1273
1274   return ret;
1275 }
1276
1277 /* Returns the sum of affine functions FNA and FNB.  */
1278
1279 static affine_fn
1280 affine_fn_plus (affine_fn fna, affine_fn fnb)
1281 {
1282   return affine_fn_op (PLUS_EXPR, fna, fnb);
1283 }
1284
1285 /* Returns the difference of affine functions FNA and FNB.  */
1286
1287 static affine_fn
1288 affine_fn_minus (affine_fn fna, affine_fn fnb)
1289 {
1290   return affine_fn_op (MINUS_EXPR, fna, fnb);
1291 }
1292
1293 /* Frees affine function FN.  */
1294
1295 static void
1296 affine_fn_free (affine_fn fn)
1297 {
1298   fn.release ();
1299 }
1300
1301 /* Determine for each subscript in the data dependence relation DDR
1302    the distance.  */
1303
1304 static void
1305 compute_subscript_distance (struct data_dependence_relation *ddr)
1306 {
1307   conflict_function *cf_a, *cf_b;
1308   affine_fn fn_a, fn_b, diff;
1309
1310   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
1311     {
1312       unsigned int i;
1313
1314       for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
1315         {
1316           struct subscript *subscript;
1317
1318           subscript = DDR_SUBSCRIPT (ddr, i);
1319           cf_a = SUB_CONFLICTS_IN_A (subscript);
1320           cf_b = SUB_CONFLICTS_IN_B (subscript);
1321
1322           fn_a = common_affine_function (cf_a);
1323           fn_b = common_affine_function (cf_b);
1324           if (!fn_a.exists () || !fn_b.exists ())
1325             {
1326               SUB_DISTANCE (subscript) = chrec_dont_know;
1327               return;
1328             }
1329           diff = affine_fn_minus (fn_a, fn_b);
1330
1331           if (affine_function_constant_p (diff))
1332             SUB_DISTANCE (subscript) = affine_function_base (diff);
1333           else
1334             SUB_DISTANCE (subscript) = chrec_dont_know;
1335
1336           affine_fn_free (diff);
1337         }
1338     }
1339 }
1340
1341 /* Returns the conflict function for "unknown".  */
1342
1343 static conflict_function *
1344 conflict_fn_not_known (void)
1345 {
1346   conflict_function *fn = XCNEW (conflict_function);
1347   fn->n = NOT_KNOWN;
1348
1349   return fn;
1350 }
1351
1352 /* Returns the conflict function for "independent".  */
1353
1354 static conflict_function *
1355 conflict_fn_no_dependence (void)
1356 {
1357   conflict_function *fn = XCNEW (conflict_function);
1358   fn->n = NO_DEPENDENCE;
1359
1360   return fn;
1361 }
1362
1363 /* Returns true if the address of OBJ is invariant in LOOP.  */
1364
1365 static bool
1366 object_address_invariant_in_loop_p (const struct loop *loop, const_tree obj)
1367 {
1368   while (handled_component_p (obj))
1369     {
1370       if (TREE_CODE (obj) == ARRAY_REF)
1371         {
1372           /* Index of the ARRAY_REF was zeroed in analyze_indices, thus we only
1373              need to check the stride and the lower bound of the reference.  */
1374           if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 2),
1375                                                       loop->num)
1376               || chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 3),
1377                                                          loop->num))
1378             return false;
1379         }
1380       else if (TREE_CODE (obj) == COMPONENT_REF)
1381         {
1382           if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 2),
1383                                                       loop->num))
1384             return false;
1385         }
1386       obj = TREE_OPERAND (obj, 0);
1387     }
1388
1389   if (!INDIRECT_REF_P (obj)
1390       && TREE_CODE (obj) != MEM_REF)
1391     return true;
1392
1393   return !chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 0),
1394                                                   loop->num);
1395 }
1396
1397 /* Returns false if we can prove that data references A and B do not alias,
1398    true otherwise.  If LOOP_NEST is false no cross-iteration aliases are
1399    considered.  */
1400
1401 bool
1402 dr_may_alias_p (const struct data_reference *a, const struct data_reference *b,
1403                 bool loop_nest)
1404 {
1405   tree addr_a = DR_BASE_OBJECT (a);
1406   tree addr_b = DR_BASE_OBJECT (b);
1407
1408   /* If we are not processing a loop nest but scalar code we
1409      do not need to care about possible cross-iteration dependences
1410      and thus can process the full original reference.  Do so,
1411      similar to how loop invariant motion applies extra offset-based
1412      disambiguation.  */
1413   if (!loop_nest)
1414     {
1415       aff_tree off1, off2;
1416       widest_int size1, size2;
1417       get_inner_reference_aff (DR_REF (a), &off1, &size1);
1418       get_inner_reference_aff (DR_REF (b), &off2, &size2);
1419       aff_combination_scale (&off1, -1);
1420       aff_combination_add (&off2, &off1);
1421       if (aff_comb_cannot_overlap_p (&off2, size1, size2))
1422         return false;
1423     }
1424
1425   if ((TREE_CODE (addr_a) == MEM_REF || TREE_CODE (addr_a) == TARGET_MEM_REF)
1426       && (TREE_CODE (addr_b) == MEM_REF || TREE_CODE (addr_b) == TARGET_MEM_REF)
1427       && MR_DEPENDENCE_CLIQUE (addr_a) == MR_DEPENDENCE_CLIQUE (addr_b)
1428       && MR_DEPENDENCE_BASE (addr_a) != MR_DEPENDENCE_BASE (addr_b))
1429     return false;
1430
1431   /* If we had an evolution in a pointer-based MEM_REF BASE_OBJECT we
1432      do not know the size of the base-object.  So we cannot do any
1433      offset/overlap based analysis but have to rely on points-to
1434      information only.  */
1435   if (TREE_CODE (addr_a) == MEM_REF
1436       && (DR_UNCONSTRAINED_BASE (a)
1437           || TREE_CODE (TREE_OPERAND (addr_a, 0)) == SSA_NAME))
1438     {
1439       /* For true dependences we can apply TBAA.  */
1440       if (flag_strict_aliasing
1441           && DR_IS_WRITE (a) && DR_IS_READ (b)
1442           && !alias_sets_conflict_p (get_alias_set (DR_REF (a)),
1443                                      get_alias_set (DR_REF (b))))
1444         return false;
1445       if (TREE_CODE (addr_b) == MEM_REF)
1446         return ptr_derefs_may_alias_p (TREE_OPERAND (addr_a, 0),
1447                                        TREE_OPERAND (addr_b, 0));
1448       else
1449         return ptr_derefs_may_alias_p (TREE_OPERAND (addr_a, 0),
1450                                        build_fold_addr_expr (addr_b));
1451     }
1452   else if (TREE_CODE (addr_b) == MEM_REF
1453            && (DR_UNCONSTRAINED_BASE (b)
1454                || TREE_CODE (TREE_OPERAND (addr_b, 0)) == SSA_NAME))
1455     {
1456       /* For true dependences we can apply TBAA.  */
1457       if (flag_strict_aliasing
1458           && DR_IS_WRITE (a) && DR_IS_READ (b)
1459           && !alias_sets_conflict_p (get_alias_set (DR_REF (a)),
1460                                      get_alias_set (DR_REF (b))))
1461         return false;
1462       if (TREE_CODE (addr_a) == MEM_REF)
1463         return ptr_derefs_may_alias_p (TREE_OPERAND (addr_a, 0),
1464                                        TREE_OPERAND (addr_b, 0));
1465       else
1466         return ptr_derefs_may_alias_p (build_fold_addr_expr (addr_a),
1467                                        TREE_OPERAND (addr_b, 0));
1468     }
1469
1470   /* Otherwise DR_BASE_OBJECT is an access that covers the whole object
1471      that is being subsetted in the loop nest.  */
1472   if (DR_IS_WRITE (a) && DR_IS_WRITE (b))
1473     return refs_output_dependent_p (addr_a, addr_b);
1474   else if (DR_IS_READ (a) && DR_IS_WRITE (b))
1475     return refs_anti_dependent_p (addr_a, addr_b);
1476   return refs_may_alias_p (addr_a, addr_b);
1477 }
1478
1479 /* Initialize a data dependence relation between data accesses A and
1480    B.  NB_LOOPS is the number of loops surrounding the references: the
1481    size of the classic distance/direction vectors.  */
1482
1483 struct data_dependence_relation *
1484 initialize_data_dependence_relation (struct data_reference *a,
1485                                      struct data_reference *b,
1486                                      vec<loop_p> loop_nest)
1487 {
1488   struct data_dependence_relation *res;
1489   unsigned int i;
1490
1491   res = XNEW (struct data_dependence_relation);
1492   DDR_A (res) = a;
1493   DDR_B (res) = b;
1494   DDR_LOOP_NEST (res).create (0);
1495   DDR_REVERSED_P (res) = false;
1496   DDR_SUBSCRIPTS (res).create (0);
1497   DDR_DIR_VECTS (res).create (0);
1498   DDR_DIST_VECTS (res).create (0);
1499
1500   if (a == NULL || b == NULL)
1501     {
1502       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1503       return res;
1504     }
1505
1506   /* If the data references do not alias, then they are independent.  */
1507   if (!dr_may_alias_p (a, b, loop_nest.exists ()))
1508     {
1509       DDR_ARE_DEPENDENT (res) = chrec_known;
1510       return res;
1511     }
1512
1513   /* The case where the references are exactly the same.  */
1514   if (operand_equal_p (DR_REF (a), DR_REF (b), 0))
1515     {
1516      if (loop_nest.exists ()
1517         && !object_address_invariant_in_loop_p (loop_nest[0],
1518                                                 DR_BASE_OBJECT (a)))
1519       {
1520         DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1521         return res;
1522       }
1523       DDR_AFFINE_P (res) = true;
1524       DDR_ARE_DEPENDENT (res) = NULL_TREE;
1525       DDR_SUBSCRIPTS (res).create (DR_NUM_DIMENSIONS (a));
1526       DDR_LOOP_NEST (res) = loop_nest;
1527       DDR_INNER_LOOP (res) = 0;
1528       DDR_SELF_REFERENCE (res) = true;
1529       for (i = 0; i < DR_NUM_DIMENSIONS (a); i++)
1530        {
1531          struct subscript *subscript;
1532
1533          subscript = XNEW (struct subscript);
1534          SUB_CONFLICTS_IN_A (subscript) = conflict_fn_not_known ();
1535          SUB_CONFLICTS_IN_B (subscript) = conflict_fn_not_known ();
1536          SUB_LAST_CONFLICT (subscript) = chrec_dont_know;
1537          SUB_DISTANCE (subscript) = chrec_dont_know;
1538          DDR_SUBSCRIPTS (res).safe_push (subscript);
1539        }
1540       return res;
1541     }
1542
1543   /* If the references do not access the same object, we do not know
1544      whether they alias or not.  */
1545   if (!operand_equal_p (DR_BASE_OBJECT (a), DR_BASE_OBJECT (b), 0))
1546     {
1547       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1548       return res;
1549     }
1550
1551   /* If the base of the object is not invariant in the loop nest, we cannot
1552      analyze it.  TODO -- in fact, it would suffice to record that there may
1553      be arbitrary dependences in the loops where the base object varies.  */
1554   if (loop_nest.exists ()
1555       && !object_address_invariant_in_loop_p (loop_nest[0],
1556                                               DR_BASE_OBJECT (a)))
1557     {
1558       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1559       return res;
1560     }
1561
1562   /* If the number of dimensions of the access to not agree we can have
1563      a pointer access to a component of the array element type and an
1564      array access while the base-objects are still the same.  Punt.  */
1565   if (DR_NUM_DIMENSIONS (a) != DR_NUM_DIMENSIONS (b))
1566     {
1567       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1568       return res;
1569     }
1570
1571   DDR_AFFINE_P (res) = true;
1572   DDR_ARE_DEPENDENT (res) = NULL_TREE;
1573   DDR_SUBSCRIPTS (res).create (DR_NUM_DIMENSIONS (a));
1574   DDR_LOOP_NEST (res) = loop_nest;
1575   DDR_INNER_LOOP (res) = 0;
1576   DDR_SELF_REFERENCE (res) = false;
1577
1578   for (i = 0; i < DR_NUM_DIMENSIONS (a); i++)
1579     {
1580       struct subscript *subscript;
1581
1582       subscript = XNEW (struct subscript);
1583       SUB_CONFLICTS_IN_A (subscript) = conflict_fn_not_known ();
1584       SUB_CONFLICTS_IN_B (subscript) = conflict_fn_not_known ();
1585       SUB_LAST_CONFLICT (subscript) = chrec_dont_know;
1586       SUB_DISTANCE (subscript) = chrec_dont_know;
1587       DDR_SUBSCRIPTS (res).safe_push (subscript);
1588     }
1589
1590   return res;
1591 }
1592
1593 /* Frees memory used by the conflict function F.  */
1594
1595 static void
1596 free_conflict_function (conflict_function *f)
1597 {
1598   unsigned i;
1599
1600   if (CF_NONTRIVIAL_P (f))
1601     {
1602       for (i = 0; i < f->n; i++)
1603         affine_fn_free (f->fns[i]);
1604     }
1605   free (f);
1606 }
1607
1608 /* Frees memory used by SUBSCRIPTS.  */
1609
1610 static void
1611 free_subscripts (vec<subscript_p> subscripts)
1612 {
1613   unsigned i;
1614   subscript_p s;
1615
1616   FOR_EACH_VEC_ELT (subscripts, i, s)
1617     {
1618       free_conflict_function (s->conflicting_iterations_in_a);
1619       free_conflict_function (s->conflicting_iterations_in_b);
1620       free (s);
1621     }
1622   subscripts.release ();
1623 }
1624
1625 /* Set DDR_ARE_DEPENDENT to CHREC and finalize the subscript overlap
1626    description.  */
1627
1628 static inline void
1629 finalize_ddr_dependent (struct data_dependence_relation *ddr,
1630                         tree chrec)
1631 {
1632   DDR_ARE_DEPENDENT (ddr) = chrec;
1633   free_subscripts (DDR_SUBSCRIPTS (ddr));
1634   DDR_SUBSCRIPTS (ddr).create (0);
1635 }
1636
1637 /* The dependence relation DDR cannot be represented by a distance
1638    vector.  */
1639
1640 static inline void
1641 non_affine_dependence_relation (struct data_dependence_relation *ddr)
1642 {
1643   if (dump_file && (dump_flags & TDF_DETAILS))
1644     fprintf (dump_file, "(Dependence relation cannot be represented by distance vector.) \n");
1645
1646   DDR_AFFINE_P (ddr) = false;
1647 }
1648
1649 \f
1650
1651 /* This section contains the classic Banerjee tests.  */
1652
1653 /* Returns true iff CHREC_A and CHREC_B are not dependent on any index
1654    variables, i.e., if the ZIV (Zero Index Variable) test is true.  */
1655
1656 static inline bool
1657 ziv_subscript_p (const_tree chrec_a, const_tree chrec_b)
1658 {
1659   return (evolution_function_is_constant_p (chrec_a)
1660           && evolution_function_is_constant_p (chrec_b));
1661 }
1662
1663 /* Returns true iff CHREC_A and CHREC_B are dependent on an index
1664    variable, i.e., if the SIV (Single Index Variable) test is true.  */
1665
1666 static bool
1667 siv_subscript_p (const_tree chrec_a, const_tree chrec_b)
1668 {
1669   if ((evolution_function_is_constant_p (chrec_a)
1670        && evolution_function_is_univariate_p (chrec_b))
1671       || (evolution_function_is_constant_p (chrec_b)
1672           && evolution_function_is_univariate_p (chrec_a)))
1673     return true;
1674
1675   if (evolution_function_is_univariate_p (chrec_a)
1676       && evolution_function_is_univariate_p (chrec_b))
1677     {
1678       switch (TREE_CODE (chrec_a))
1679         {
1680         case POLYNOMIAL_CHREC:
1681           switch (TREE_CODE (chrec_b))
1682             {
1683             case POLYNOMIAL_CHREC:
1684               if (CHREC_VARIABLE (chrec_a) != CHREC_VARIABLE (chrec_b))
1685                 return false;
1686
1687             default:
1688               return true;
1689             }
1690
1691         default:
1692           return true;
1693         }
1694     }
1695
1696   return false;
1697 }
1698
1699 /* Creates a conflict function with N dimensions.  The affine functions
1700    in each dimension follow.  */
1701
1702 static conflict_function *
1703 conflict_fn (unsigned n, ...)
1704 {
1705   unsigned i;
1706   conflict_function *ret = XCNEW (conflict_function);
1707   va_list ap;
1708
1709   gcc_assert (0 < n && n <= MAX_DIM);
1710   va_start (ap, n);
1711
1712   ret->n = n;
1713   for (i = 0; i < n; i++)
1714     ret->fns[i] = va_arg (ap, affine_fn);
1715   va_end (ap);
1716
1717   return ret;
1718 }
1719
1720 /* Returns constant affine function with value CST.  */
1721
1722 static affine_fn
1723 affine_fn_cst (tree cst)
1724 {
1725   affine_fn fn;
1726   fn.create (1);
1727   fn.quick_push (cst);
1728   return fn;
1729 }
1730
1731 /* Returns affine function with single variable, CST + COEF * x_DIM.  */
1732
1733 static affine_fn
1734 affine_fn_univar (tree cst, unsigned dim, tree coef)
1735 {
1736   affine_fn fn;
1737   fn.create (dim + 1);
1738   unsigned i;
1739
1740   gcc_assert (dim > 0);
1741   fn.quick_push (cst);
1742   for (i = 1; i < dim; i++)
1743     fn.quick_push (integer_zero_node);
1744   fn.quick_push (coef);
1745   return fn;
1746 }
1747
1748 /* Analyze a ZIV (Zero Index Variable) subscript.  *OVERLAPS_A and
1749    *OVERLAPS_B are initialized to the functions that describe the
1750    relation between the elements accessed twice by CHREC_A and
1751    CHREC_B.  For k >= 0, the following property is verified:
1752
1753    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
1754
1755 static void
1756 analyze_ziv_subscript (tree chrec_a,
1757                        tree chrec_b,
1758                        conflict_function **overlaps_a,
1759                        conflict_function **overlaps_b,
1760                        tree *last_conflicts)
1761 {
1762   tree type, difference;
1763   dependence_stats.num_ziv++;
1764
1765   if (dump_file && (dump_flags & TDF_DETAILS))
1766     fprintf (dump_file, "(analyze_ziv_subscript \n");
1767
1768   type = signed_type_for_types (TREE_TYPE (chrec_a), TREE_TYPE (chrec_b));
1769   chrec_a = chrec_convert (type, chrec_a, NULL);
1770   chrec_b = chrec_convert (type, chrec_b, NULL);
1771   difference = chrec_fold_minus (type, chrec_a, chrec_b);
1772
1773   switch (TREE_CODE (difference))
1774     {
1775     case INTEGER_CST:
1776       if (integer_zerop (difference))
1777         {
1778           /* The difference is equal to zero: the accessed index
1779              overlaps for each iteration in the loop.  */
1780           *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1781           *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1782           *last_conflicts = chrec_dont_know;
1783           dependence_stats.num_ziv_dependent++;
1784         }
1785       else
1786         {
1787           /* The accesses do not overlap.  */
1788           *overlaps_a = conflict_fn_no_dependence ();
1789           *overlaps_b = conflict_fn_no_dependence ();
1790           *last_conflicts = integer_zero_node;
1791           dependence_stats.num_ziv_independent++;
1792         }
1793       break;
1794
1795     default:
1796       /* We're not sure whether the indexes overlap.  For the moment,
1797          conservatively answer "don't know".  */
1798       if (dump_file && (dump_flags & TDF_DETAILS))
1799         fprintf (dump_file, "ziv test failed: difference is non-integer.\n");
1800
1801       *overlaps_a = conflict_fn_not_known ();
1802       *overlaps_b = conflict_fn_not_known ();
1803       *last_conflicts = chrec_dont_know;
1804       dependence_stats.num_ziv_unimplemented++;
1805       break;
1806     }
1807
1808   if (dump_file && (dump_flags & TDF_DETAILS))
1809     fprintf (dump_file, ")\n");
1810 }
1811
1812 /* Similar to max_stmt_executions_int, but returns the bound as a tree,
1813    and only if it fits to the int type.  If this is not the case, or the
1814    bound  on the number of iterations of LOOP could not be derived, returns
1815    chrec_dont_know.  */
1816
1817 static tree
1818 max_stmt_executions_tree (struct loop *loop)
1819 {
1820   widest_int nit;
1821
1822   if (!max_stmt_executions (loop, &nit))
1823     return chrec_dont_know;
1824
1825   if (!wi::fits_to_tree_p (nit, unsigned_type_node))
1826     return chrec_dont_know;
1827
1828   return wide_int_to_tree (unsigned_type_node, nit);
1829 }
1830
1831 /* Determine whether the CHREC is always positive/negative.  If the expression
1832    cannot be statically analyzed, return false, otherwise set the answer into
1833    VALUE.  */
1834
1835 static bool
1836 chrec_is_positive (tree chrec, bool *value)
1837 {
1838   bool value0, value1, value2;
1839   tree end_value, nb_iter;
1840
1841   switch (TREE_CODE (chrec))
1842     {
1843     case POLYNOMIAL_CHREC:
1844       if (!chrec_is_positive (CHREC_LEFT (chrec), &value0)
1845           || !chrec_is_positive (CHREC_RIGHT (chrec), &value1))
1846         return false;
1847
1848       /* FIXME -- overflows.  */
1849       if (value0 == value1)
1850         {
1851           *value = value0;
1852           return true;
1853         }
1854
1855       /* Otherwise the chrec is under the form: "{-197, +, 2}_1",
1856          and the proof consists in showing that the sign never
1857          changes during the execution of the loop, from 0 to
1858          loop->nb_iterations.  */
1859       if (!evolution_function_is_affine_p (chrec))
1860         return false;
1861
1862       nb_iter = number_of_latch_executions (get_chrec_loop (chrec));
1863       if (chrec_contains_undetermined (nb_iter))
1864         return false;
1865
1866 #if 0
1867       /* TODO -- If the test is after the exit, we may decrease the number of
1868          iterations by one.  */
1869       if (after_exit)
1870         nb_iter = chrec_fold_minus (type, nb_iter, build_int_cst (type, 1));
1871 #endif
1872
1873       end_value = chrec_apply (CHREC_VARIABLE (chrec), chrec, nb_iter);
1874
1875       if (!chrec_is_positive (end_value, &value2))
1876         return false;
1877
1878       *value = value0;
1879       return value0 == value1;
1880
1881     case INTEGER_CST:
1882       switch (tree_int_cst_sgn (chrec))
1883         {
1884         case -1:
1885           *value = false;
1886           break;
1887         case 1:
1888           *value = true;
1889           break;
1890         default:
1891           return false;
1892         }
1893       return true;
1894
1895     default:
1896       return false;
1897     }
1898 }
1899
1900
1901 /* Analyze a SIV (Single Index Variable) subscript where CHREC_A is a
1902    constant, and CHREC_B is an affine function.  *OVERLAPS_A and
1903    *OVERLAPS_B are initialized to the functions that describe the
1904    relation between the elements accessed twice by CHREC_A and
1905    CHREC_B.  For k >= 0, the following property is verified:
1906
1907    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
1908
1909 static void
1910 analyze_siv_subscript_cst_affine (tree chrec_a,
1911                                   tree chrec_b,
1912                                   conflict_function **overlaps_a,
1913                                   conflict_function **overlaps_b,
1914                                   tree *last_conflicts)
1915 {
1916   bool value0, value1, value2;
1917   tree type, difference, tmp;
1918
1919   type = signed_type_for_types (TREE_TYPE (chrec_a), TREE_TYPE (chrec_b));
1920   chrec_a = chrec_convert (type, chrec_a, NULL);
1921   chrec_b = chrec_convert (type, chrec_b, NULL);
1922   difference = chrec_fold_minus (type, initial_condition (chrec_b), chrec_a);
1923
1924   /* Special case overlap in the first iteration.  */
1925   if (integer_zerop (difference))
1926     {
1927       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1928       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1929       *last_conflicts = integer_one_node;
1930       return;
1931     }
1932
1933   if (!chrec_is_positive (initial_condition (difference), &value0))
1934     {
1935       if (dump_file && (dump_flags & TDF_DETAILS))
1936         fprintf (dump_file, "siv test failed: chrec is not positive.\n");
1937
1938       dependence_stats.num_siv_unimplemented++;
1939       *overlaps_a = conflict_fn_not_known ();
1940       *overlaps_b = conflict_fn_not_known ();
1941       *last_conflicts = chrec_dont_know;
1942       return;
1943     }
1944   else
1945     {
1946       if (value0 == false)
1947         {
1948           if (!chrec_is_positive (CHREC_RIGHT (chrec_b), &value1))
1949             {
1950               if (dump_file && (dump_flags & TDF_DETAILS))
1951                 fprintf (dump_file, "siv test failed: chrec not positive.\n");
1952
1953               *overlaps_a = conflict_fn_not_known ();
1954               *overlaps_b = conflict_fn_not_known ();
1955               *last_conflicts = chrec_dont_know;
1956               dependence_stats.num_siv_unimplemented++;
1957               return;
1958             }
1959           else
1960             {
1961               if (value1 == true)
1962                 {
1963                   /* Example:
1964                      chrec_a = 12
1965                      chrec_b = {10, +, 1}
1966                   */
1967
1968                   if (tree_fold_divides_p (CHREC_RIGHT (chrec_b), difference))
1969                     {
1970                       HOST_WIDE_INT numiter;
1971                       struct loop *loop = get_chrec_loop (chrec_b);
1972
1973                       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1974                       tmp = fold_build2 (EXACT_DIV_EXPR, type,
1975                                          fold_build1 (ABS_EXPR, type, difference),
1976                                          CHREC_RIGHT (chrec_b));
1977                       *overlaps_b = conflict_fn (1, affine_fn_cst (tmp));
1978                       *last_conflicts = integer_one_node;
1979
1980
1981                       /* Perform weak-zero siv test to see if overlap is
1982                          outside the loop bounds.  */
1983                       numiter = max_stmt_executions_int (loop);
1984
1985                       if (numiter >= 0
1986                           && compare_tree_int (tmp, numiter) > 0)
1987                         {
1988                           free_conflict_function (*overlaps_a);
1989                           free_conflict_function (*overlaps_b);
1990                           *overlaps_a = conflict_fn_no_dependence ();
1991                           *overlaps_b = conflict_fn_no_dependence ();
1992                           *last_conflicts = integer_zero_node;
1993                           dependence_stats.num_siv_independent++;
1994                           return;
1995                         }
1996                       dependence_stats.num_siv_dependent++;
1997                       return;
1998                     }
1999
2000                   /* When the step does not divide the difference, there are
2001                      no overlaps.  */
2002                   else
2003                     {
2004                       *overlaps_a = conflict_fn_no_dependence ();
2005                       *overlaps_b = conflict_fn_no_dependence ();
2006                       *last_conflicts = integer_zero_node;
2007                       dependence_stats.num_siv_independent++;
2008                       return;
2009                     }
2010                 }
2011
2012               else
2013                 {
2014                   /* Example:
2015                      chrec_a = 12
2016                      chrec_b = {10, +, -1}
2017
2018                      In this case, chrec_a will not overlap with chrec_b.  */
2019                   *overlaps_a = conflict_fn_no_dependence ();
2020                   *overlaps_b = conflict_fn_no_dependence ();
2021                   *last_conflicts = integer_zero_node;
2022                   dependence_stats.num_siv_independent++;
2023                   return;
2024                 }
2025             }
2026         }
2027       else
2028         {
2029           if (!chrec_is_positive (CHREC_RIGHT (chrec_b), &value2))
2030             {
2031               if (dump_file && (dump_flags & TDF_DETAILS))
2032                 fprintf (dump_file, "siv test failed: chrec not positive.\n");
2033
2034               *overlaps_a = conflict_fn_not_known ();
2035               *overlaps_b = conflict_fn_not_known ();
2036               *last_conflicts = chrec_dont_know;
2037               dependence_stats.num_siv_unimplemented++;
2038               return;
2039             }
2040           else
2041             {
2042               if (value2 == false)
2043                 {
2044                   /* Example:
2045                      chrec_a = 3
2046                      chrec_b = {10, +, -1}
2047                   */
2048                   if (tree_fold_divides_p (CHREC_RIGHT (chrec_b), difference))
2049                     {
2050                       HOST_WIDE_INT numiter;
2051                       struct loop *loop = get_chrec_loop (chrec_b);
2052
2053                       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2054                       tmp = fold_build2 (EXACT_DIV_EXPR, type, difference,
2055                                          CHREC_RIGHT (chrec_b));
2056                       *overlaps_b = conflict_fn (1, affine_fn_cst (tmp));
2057                       *last_conflicts = integer_one_node;
2058
2059                       /* Perform weak-zero siv test to see if overlap is
2060                          outside the loop bounds.  */
2061                       numiter = max_stmt_executions_int (loop);
2062
2063                       if (numiter >= 0
2064                           && compare_tree_int (tmp, numiter) > 0)
2065                         {
2066                           free_conflict_function (*overlaps_a);
2067                           free_conflict_function (*overlaps_b);
2068                           *overlaps_a = conflict_fn_no_dependence ();
2069                           *overlaps_b = conflict_fn_no_dependence ();
2070                           *last_conflicts = integer_zero_node;
2071                           dependence_stats.num_siv_independent++;
2072                           return;
2073                         }
2074                       dependence_stats.num_siv_dependent++;
2075                       return;
2076                     }
2077
2078                   /* When the step does not divide the difference, there
2079                      are no overlaps.  */
2080                   else
2081                     {
2082                       *overlaps_a = conflict_fn_no_dependence ();
2083                       *overlaps_b = conflict_fn_no_dependence ();
2084                       *last_conflicts = integer_zero_node;
2085                       dependence_stats.num_siv_independent++;
2086                       return;
2087                     }
2088                 }
2089               else
2090                 {
2091                   /* Example:
2092                      chrec_a = 3
2093                      chrec_b = {4, +, 1}
2094
2095                      In this case, chrec_a will not overlap with chrec_b.  */
2096                   *overlaps_a = conflict_fn_no_dependence ();
2097                   *overlaps_b = conflict_fn_no_dependence ();
2098                   *last_conflicts = integer_zero_node;
2099                   dependence_stats.num_siv_independent++;
2100                   return;
2101                 }
2102             }
2103         }
2104     }
2105 }
2106
2107 /* Helper recursive function for initializing the matrix A.  Returns
2108    the initial value of CHREC.  */
2109
2110 static tree
2111 initialize_matrix_A (lambda_matrix A, tree chrec, unsigned index, int mult)
2112 {
2113   gcc_assert (chrec);
2114
2115   switch (TREE_CODE (chrec))
2116     {
2117     case POLYNOMIAL_CHREC:
2118       gcc_assert (TREE_CODE (CHREC_RIGHT (chrec)) == INTEGER_CST);
2119
2120       A[index][0] = mult * int_cst_value (CHREC_RIGHT (chrec));
2121       return initialize_matrix_A (A, CHREC_LEFT (chrec), index + 1, mult);
2122
2123     case PLUS_EXPR:
2124     case MULT_EXPR:
2125     case MINUS_EXPR:
2126       {
2127         tree op0 = initialize_matrix_A (A, TREE_OPERAND (chrec, 0), index, mult);
2128         tree op1 = initialize_matrix_A (A, TREE_OPERAND (chrec, 1), index, mult);
2129
2130         return chrec_fold_op (TREE_CODE (chrec), chrec_type (chrec), op0, op1);
2131       }
2132
2133     CASE_CONVERT:
2134       {
2135         tree op = initialize_matrix_A (A, TREE_OPERAND (chrec, 0), index, mult);
2136         return chrec_convert (chrec_type (chrec), op, NULL);
2137       }
2138
2139     case BIT_NOT_EXPR:
2140       {
2141         /* Handle ~X as -1 - X.  */
2142         tree op = initialize_matrix_A (A, TREE_OPERAND (chrec, 0), index, mult);
2143         return chrec_fold_op (MINUS_EXPR, chrec_type (chrec),
2144                               build_int_cst (TREE_TYPE (chrec), -1), op);
2145       }
2146
2147     case INTEGER_CST:
2148       return chrec;
2149
2150     default:
2151       gcc_unreachable ();
2152       return NULL_TREE;
2153     }
2154 }
2155
2156 #define FLOOR_DIV(x,y) ((x) / (y))
2157
2158 /* Solves the special case of the Diophantine equation:
2159    | {0, +, STEP_A}_x (OVERLAPS_A) = {0, +, STEP_B}_y (OVERLAPS_B)
2160
2161    Computes the descriptions OVERLAPS_A and OVERLAPS_B.  NITER is the
2162    number of iterations that loops X and Y run.  The overlaps will be
2163    constructed as evolutions in dimension DIM.  */
2164
2165 static void
2166 compute_overlap_steps_for_affine_univar (int niter, int step_a, int step_b,
2167                                          affine_fn *overlaps_a,
2168                                          affine_fn *overlaps_b,
2169                                          tree *last_conflicts, int dim)
2170 {
2171   if (((step_a > 0 && step_b > 0)
2172        || (step_a < 0 && step_b < 0)))
2173     {
2174       int step_overlaps_a, step_overlaps_b;
2175       int gcd_steps_a_b, last_conflict, tau2;
2176
2177       gcd_steps_a_b = gcd (step_a, step_b);
2178       step_overlaps_a = step_b / gcd_steps_a_b;
2179       step_overlaps_b = step_a / gcd_steps_a_b;
2180
2181       if (niter > 0)
2182         {
2183           tau2 = FLOOR_DIV (niter, step_overlaps_a);
2184           tau2 = MIN (tau2, FLOOR_DIV (niter, step_overlaps_b));
2185           last_conflict = tau2;
2186           *last_conflicts = build_int_cst (NULL_TREE, last_conflict);
2187         }
2188       else
2189         *last_conflicts = chrec_dont_know;
2190
2191       *overlaps_a = affine_fn_univar (integer_zero_node, dim,
2192                                       build_int_cst (NULL_TREE,
2193                                                      step_overlaps_a));
2194       *overlaps_b = affine_fn_univar (integer_zero_node, dim,
2195                                       build_int_cst (NULL_TREE,
2196                                                      step_overlaps_b));
2197     }
2198
2199   else
2200     {
2201       *overlaps_a = affine_fn_cst (integer_zero_node);
2202       *overlaps_b = affine_fn_cst (integer_zero_node);
2203       *last_conflicts = integer_zero_node;
2204     }
2205 }
2206
2207 /* Solves the special case of a Diophantine equation where CHREC_A is
2208    an affine bivariate function, and CHREC_B is an affine univariate
2209    function.  For example,
2210
2211    | {{0, +, 1}_x, +, 1335}_y = {0, +, 1336}_z
2212
2213    has the following overlapping functions:
2214
2215    | x (t, u, v) = {{0, +, 1336}_t, +, 1}_v
2216    | y (t, u, v) = {{0, +, 1336}_u, +, 1}_v
2217    | z (t, u, v) = {{{0, +, 1}_t, +, 1335}_u, +, 1}_v
2218
2219    FORNOW: This is a specialized implementation for a case occurring in
2220    a common benchmark.  Implement the general algorithm.  */
2221
2222 static void
2223 compute_overlap_steps_for_affine_1_2 (tree chrec_a, tree chrec_b,
2224                                       conflict_function **overlaps_a,
2225                                       conflict_function **overlaps_b,
2226                                       tree *last_conflicts)
2227 {
2228   bool xz_p, yz_p, xyz_p;
2229   int step_x, step_y, step_z;
2230   HOST_WIDE_INT niter_x, niter_y, niter_z, niter;
2231   affine_fn overlaps_a_xz, overlaps_b_xz;
2232   affine_fn overlaps_a_yz, overlaps_b_yz;
2233   affine_fn overlaps_a_xyz, overlaps_b_xyz;
2234   affine_fn ova1, ova2, ovb;
2235   tree last_conflicts_xz, last_conflicts_yz, last_conflicts_xyz;
2236
2237   step_x = int_cst_value (CHREC_RIGHT (CHREC_LEFT (chrec_a)));
2238   step_y = int_cst_value (CHREC_RIGHT (chrec_a));
2239   step_z = int_cst_value (CHREC_RIGHT (chrec_b));
2240
2241   niter_x = max_stmt_executions_int (get_chrec_loop (CHREC_LEFT (chrec_a)));
2242   niter_y = max_stmt_executions_int (get_chrec_loop (chrec_a));
2243   niter_z = max_stmt_executions_int (get_chrec_loop (chrec_b));
2244
2245   if (niter_x < 0 || niter_y < 0 || niter_z < 0)
2246     {
2247       if (dump_file && (dump_flags & TDF_DETAILS))
2248         fprintf (dump_file, "overlap steps test failed: no iteration counts.\n");
2249
2250       *overlaps_a = conflict_fn_not_known ();
2251       *overlaps_b = conflict_fn_not_known ();
2252       *last_conflicts = chrec_dont_know;
2253       return;
2254     }
2255
2256   niter = MIN (niter_x, niter_z);
2257   compute_overlap_steps_for_affine_univar (niter, step_x, step_z,
2258                                            &overlaps_a_xz,
2259                                            &overlaps_b_xz,
2260                                            &last_conflicts_xz, 1);
2261   niter = MIN (niter_y, niter_z);
2262   compute_overlap_steps_for_affine_univar (niter, step_y, step_z,
2263                                            &overlaps_a_yz,
2264                                            &overlaps_b_yz,
2265                                            &last_conflicts_yz, 2);
2266   niter = MIN (niter_x, niter_z);
2267   niter = MIN (niter_y, niter);
2268   compute_overlap_steps_for_affine_univar (niter, step_x + step_y, step_z,
2269                                            &overlaps_a_xyz,
2270                                            &overlaps_b_xyz,
2271                                            &last_conflicts_xyz, 3);
2272
2273   xz_p = !integer_zerop (last_conflicts_xz);
2274   yz_p = !integer_zerop (last_conflicts_yz);
2275   xyz_p = !integer_zerop (last_conflicts_xyz);
2276
2277   if (xz_p || yz_p || xyz_p)
2278     {
2279       ova1 = affine_fn_cst (integer_zero_node);
2280       ova2 = affine_fn_cst (integer_zero_node);
2281       ovb = affine_fn_cst (integer_zero_node);
2282       if (xz_p)
2283         {
2284           affine_fn t0 = ova1;
2285           affine_fn t2 = ovb;
2286
2287           ova1 = affine_fn_plus (ova1, overlaps_a_xz);
2288           ovb = affine_fn_plus (ovb, overlaps_b_xz);
2289           affine_fn_free (t0);
2290           affine_fn_free (t2);
2291           *last_conflicts = last_conflicts_xz;
2292         }
2293       if (yz_p)
2294         {
2295           affine_fn t0 = ova2;
2296           affine_fn t2 = ovb;
2297
2298           ova2 = affine_fn_plus (ova2, overlaps_a_yz);
2299           ovb = affine_fn_plus (ovb, overlaps_b_yz);
2300           affine_fn_free (t0);
2301           affine_fn_free (t2);
2302           *last_conflicts = last_conflicts_yz;
2303         }
2304       if (xyz_p)
2305         {
2306           affine_fn t0 = ova1;
2307           affine_fn t2 = ova2;
2308           affine_fn t4 = ovb;
2309
2310           ova1 = affine_fn_plus (ova1, overlaps_a_xyz);
2311           ova2 = affine_fn_plus (ova2, overlaps_a_xyz);
2312           ovb = affine_fn_plus (ovb, overlaps_b_xyz);
2313           affine_fn_free (t0);
2314           affine_fn_free (t2);
2315           affine_fn_free (t4);
2316           *last_conflicts = last_conflicts_xyz;
2317         }
2318       *overlaps_a = conflict_fn (2, ova1, ova2);
2319       *overlaps_b = conflict_fn (1, ovb);
2320     }
2321   else
2322     {
2323       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2324       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2325       *last_conflicts = integer_zero_node;
2326     }
2327
2328   affine_fn_free (overlaps_a_xz);
2329   affine_fn_free (overlaps_b_xz);
2330   affine_fn_free (overlaps_a_yz);
2331   affine_fn_free (overlaps_b_yz);
2332   affine_fn_free (overlaps_a_xyz);
2333   affine_fn_free (overlaps_b_xyz);
2334 }
2335
2336 /* Copy the elements of vector VEC1 with length SIZE to VEC2.  */
2337
2338 static void
2339 lambda_vector_copy (lambda_vector vec1, lambda_vector vec2,
2340                     int size)
2341 {
2342   memcpy (vec2, vec1, size * sizeof (*vec1));
2343 }
2344
2345 /* Copy the elements of M x N matrix MAT1 to MAT2.  */
2346
2347 static void
2348 lambda_matrix_copy (lambda_matrix mat1, lambda_matrix mat2,
2349                     int m, int n)
2350 {
2351   int i;
2352
2353   for (i = 0; i < m; i++)
2354     lambda_vector_copy (mat1[i], mat2[i], n);
2355 }
2356
2357 /* Store the N x N identity matrix in MAT.  */
2358
2359 static void
2360 lambda_matrix_id (lambda_matrix mat, int size)
2361 {
2362   int i, j;
2363
2364   for (i = 0; i < size; i++)
2365     for (j = 0; j < size; j++)
2366       mat[i][j] = (i == j) ? 1 : 0;
2367 }
2368
2369 /* Return the first nonzero element of vector VEC1 between START and N.
2370    We must have START <= N.   Returns N if VEC1 is the zero vector.  */
2371
2372 static int
2373 lambda_vector_first_nz (lambda_vector vec1, int n, int start)
2374 {
2375   int j = start;
2376   while (j < n && vec1[j] == 0)
2377     j++;
2378   return j;
2379 }
2380
2381 /* Add a multiple of row R1 of matrix MAT with N columns to row R2:
2382    R2 = R2 + CONST1 * R1.  */
2383
2384 static void
2385 lambda_matrix_row_add (lambda_matrix mat, int n, int r1, int r2, int const1)
2386 {
2387   int i;
2388
2389   if (const1 == 0)
2390     return;
2391
2392   for (i = 0; i < n; i++)
2393     mat[r2][i] += const1 * mat[r1][i];
2394 }
2395
2396 /* Multiply vector VEC1 of length SIZE by a constant CONST1,
2397    and store the result in VEC2.  */
2398
2399 static void
2400 lambda_vector_mult_const (lambda_vector vec1, lambda_vector vec2,
2401                           int size, int const1)
2402 {
2403   int i;
2404
2405   if (const1 == 0)
2406     lambda_vector_clear (vec2, size);
2407   else
2408     for (i = 0; i < size; i++)
2409       vec2[i] = const1 * vec1[i];
2410 }
2411
2412 /* Negate vector VEC1 with length SIZE and store it in VEC2.  */
2413
2414 static void
2415 lambda_vector_negate (lambda_vector vec1, lambda_vector vec2,
2416                       int size)
2417 {
2418   lambda_vector_mult_const (vec1, vec2, size, -1);
2419 }
2420
2421 /* Negate row R1 of matrix MAT which has N columns.  */
2422
2423 static void
2424 lambda_matrix_row_negate (lambda_matrix mat, int n, int r1)
2425 {
2426   lambda_vector_negate (mat[r1], mat[r1], n);
2427 }
2428
2429 /* Return true if two vectors are equal.  */
2430
2431 static bool
2432 lambda_vector_equal (lambda_vector vec1, lambda_vector vec2, int size)
2433 {
2434   int i;
2435   for (i = 0; i < size; i++)
2436     if (vec1[i] != vec2[i])
2437       return false;
2438   return true;
2439 }
2440
2441 /* Given an M x N integer matrix A, this function determines an M x
2442    M unimodular matrix U, and an M x N echelon matrix S such that
2443    "U.A = S".  This decomposition is also known as "right Hermite".
2444
2445    Ref: Algorithm 2.1 page 33 in "Loop Transformations for
2446    Restructuring Compilers" Utpal Banerjee.  */
2447
2448 static void
2449 lambda_matrix_right_hermite (lambda_matrix A, int m, int n,
2450                              lambda_matrix S, lambda_matrix U)
2451 {
2452   int i, j, i0 = 0;
2453
2454   lambda_matrix_copy (A, S, m, n);
2455   lambda_matrix_id (U, m);
2456
2457   for (j = 0; j < n; j++)
2458     {
2459       if (lambda_vector_first_nz (S[j], m, i0) < m)
2460         {
2461           ++i0;
2462           for (i = m - 1; i >= i0; i--)
2463             {
2464               while (S[i][j] != 0)
2465                 {
2466                   int sigma, factor, a, b;
2467
2468                   a = S[i-1][j];
2469                   b = S[i][j];
2470                   sigma = (a * b < 0) ? -1: 1;
2471                   a = abs (a);
2472                   b = abs (b);
2473                   factor = sigma * (a / b);
2474
2475                   lambda_matrix_row_add (S, n, i, i-1, -factor);
2476                   std::swap (S[i], S[i-1]);
2477
2478                   lambda_matrix_row_add (U, m, i, i-1, -factor);
2479                   std::swap (U[i], U[i-1]);
2480                 }
2481             }
2482         }
2483     }
2484 }
2485
2486 /* Determines the overlapping elements due to accesses CHREC_A and
2487    CHREC_B, that are affine functions.  This function cannot handle
2488    symbolic evolution functions, ie. when initial conditions are
2489    parameters, because it uses lambda matrices of integers.  */
2490
2491 static void
2492 analyze_subscript_affine_affine (tree chrec_a,
2493                                  tree chrec_b,
2494                                  conflict_function **overlaps_a,
2495                                  conflict_function **overlaps_b,
2496                                  tree *last_conflicts)
2497 {
2498   unsigned nb_vars_a, nb_vars_b, dim;
2499   HOST_WIDE_INT init_a, init_b, gamma, gcd_alpha_beta;
2500   lambda_matrix A, U, S;
2501   struct obstack scratch_obstack;
2502
2503   if (eq_evolutions_p (chrec_a, chrec_b))
2504     {
2505       /* The accessed index overlaps for each iteration in the
2506          loop.  */
2507       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2508       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2509       *last_conflicts = chrec_dont_know;
2510       return;
2511     }
2512   if (dump_file && (dump_flags & TDF_DETAILS))
2513     fprintf (dump_file, "(analyze_subscript_affine_affine \n");
2514
2515   /* For determining the initial intersection, we have to solve a
2516      Diophantine equation.  This is the most time consuming part.
2517
2518      For answering to the question: "Is there a dependence?" we have
2519      to prove that there exists a solution to the Diophantine
2520      equation, and that the solution is in the iteration domain,
2521      i.e. the solution is positive or zero, and that the solution
2522      happens before the upper bound loop.nb_iterations.  Otherwise
2523      there is no dependence.  This function outputs a description of
2524      the iterations that hold the intersections.  */
2525
2526   nb_vars_a = nb_vars_in_chrec (chrec_a);
2527   nb_vars_b = nb_vars_in_chrec (chrec_b);
2528
2529   gcc_obstack_init (&scratch_obstack);
2530
2531   dim = nb_vars_a + nb_vars_b;
2532   U = lambda_matrix_new (dim, dim, &scratch_obstack);
2533   A = lambda_matrix_new (dim, 1, &scratch_obstack);
2534   S = lambda_matrix_new (dim, 1, &scratch_obstack);
2535
2536   init_a = int_cst_value (initialize_matrix_A (A, chrec_a, 0, 1));
2537   init_b = int_cst_value (initialize_matrix_A (A, chrec_b, nb_vars_a, -1));
2538   gamma = init_b - init_a;
2539
2540   /* Don't do all the hard work of solving the Diophantine equation
2541      when we already know the solution: for example,
2542      | {3, +, 1}_1
2543      | {3, +, 4}_2
2544      | gamma = 3 - 3 = 0.
2545      Then the first overlap occurs during the first iterations:
2546      | {3, +, 1}_1 ({0, +, 4}_x) = {3, +, 4}_2 ({0, +, 1}_x)
2547   */
2548   if (gamma == 0)
2549     {
2550       if (nb_vars_a == 1 && nb_vars_b == 1)
2551         {
2552           HOST_WIDE_INT step_a, step_b;
2553           HOST_WIDE_INT niter, niter_a, niter_b;
2554           affine_fn ova, ovb;
2555
2556           niter_a = max_stmt_executions_int (get_chrec_loop (chrec_a));
2557           niter_b = max_stmt_executions_int (get_chrec_loop (chrec_b));
2558           niter = MIN (niter_a, niter_b);
2559           step_a = int_cst_value (CHREC_RIGHT (chrec_a));
2560           step_b = int_cst_value (CHREC_RIGHT (chrec_b));
2561
2562           compute_overlap_steps_for_affine_univar (niter, step_a, step_b,
2563                                                    &ova, &ovb,
2564                                                    last_conflicts, 1);
2565           *overlaps_a = conflict_fn (1, ova);
2566           *overlaps_b = conflict_fn (1, ovb);
2567         }
2568
2569       else if (nb_vars_a == 2 && nb_vars_b == 1)
2570         compute_overlap_steps_for_affine_1_2
2571           (chrec_a, chrec_b, overlaps_a, overlaps_b, last_conflicts);
2572
2573       else if (nb_vars_a == 1 && nb_vars_b == 2)
2574         compute_overlap_steps_for_affine_1_2
2575           (chrec_b, chrec_a, overlaps_b, overlaps_a, last_conflicts);
2576
2577       else
2578         {
2579           if (dump_file && (dump_flags & TDF_DETAILS))
2580             fprintf (dump_file, "affine-affine test failed: too many variables.\n");
2581           *overlaps_a = conflict_fn_not_known ();
2582           *overlaps_b = conflict_fn_not_known ();
2583           *last_conflicts = chrec_dont_know;
2584         }
2585       goto end_analyze_subs_aa;
2586     }
2587
2588   /* U.A = S */
2589   lambda_matrix_right_hermite (A, dim, 1, S, U);
2590
2591   if (S[0][0] < 0)
2592     {
2593       S[0][0] *= -1;
2594       lambda_matrix_row_negate (U, dim, 0);
2595     }
2596   gcd_alpha_beta = S[0][0];
2597
2598   /* Something went wrong: for example in {1, +, 0}_5 vs. {0, +, 0}_5,
2599      but that is a quite strange case.  Instead of ICEing, answer
2600      don't know.  */
2601   if (gcd_alpha_beta == 0)
2602     {
2603       *overlaps_a = conflict_fn_not_known ();
2604       *overlaps_b = conflict_fn_not_known ();
2605       *last_conflicts = chrec_dont_know;
2606       goto end_analyze_subs_aa;
2607     }
2608
2609   /* The classic "gcd-test".  */
2610   if (!int_divides_p (gcd_alpha_beta, gamma))
2611     {
2612       /* The "gcd-test" has determined that there is no integer
2613          solution, i.e. there is no dependence.  */
2614       *overlaps_a = conflict_fn_no_dependence ();
2615       *overlaps_b = conflict_fn_no_dependence ();
2616       *last_conflicts = integer_zero_node;
2617     }
2618
2619   /* Both access functions are univariate.  This includes SIV and MIV cases.  */
2620   else if (nb_vars_a == 1 && nb_vars_b == 1)
2621     {
2622       /* Both functions should have the same evolution sign.  */
2623       if (((A[0][0] > 0 && -A[1][0] > 0)
2624            || (A[0][0] < 0 && -A[1][0] < 0)))
2625         {
2626           /* The solutions are given by:
2627              |
2628              | [GAMMA/GCD_ALPHA_BETA  t].[u11 u12]  = [x0]
2629              |                           [u21 u22]    [y0]
2630
2631              For a given integer t.  Using the following variables,
2632
2633              | i0 = u11 * gamma / gcd_alpha_beta
2634              | j0 = u12 * gamma / gcd_alpha_beta
2635              | i1 = u21
2636              | j1 = u22
2637
2638              the solutions are:
2639
2640              | x0 = i0 + i1 * t,
2641              | y0 = j0 + j1 * t.  */
2642           HOST_WIDE_INT i0, j0, i1, j1;
2643
2644           i0 = U[0][0] * gamma / gcd_alpha_beta;
2645           j0 = U[0][1] * gamma / gcd_alpha_beta;
2646           i1 = U[1][0];
2647           j1 = U[1][1];
2648
2649           if ((i1 == 0 && i0 < 0)
2650               || (j1 == 0 && j0 < 0))
2651             {
2652               /* There is no solution.
2653                  FIXME: The case "i0 > nb_iterations, j0 > nb_iterations"
2654                  falls in here, but for the moment we don't look at the
2655                  upper bound of the iteration domain.  */
2656               *overlaps_a = conflict_fn_no_dependence ();
2657               *overlaps_b = conflict_fn_no_dependence ();
2658               *last_conflicts = integer_zero_node;
2659               goto end_analyze_subs_aa;
2660             }
2661
2662           if (i1 > 0 && j1 > 0)
2663             {
2664               HOST_WIDE_INT niter_a
2665                 = max_stmt_executions_int (get_chrec_loop (chrec_a));
2666               HOST_WIDE_INT niter_b
2667                 = max_stmt_executions_int (get_chrec_loop (chrec_b));
2668               HOST_WIDE_INT niter = MIN (niter_a, niter_b);
2669
2670               /* (X0, Y0) is a solution of the Diophantine equation:
2671                  "chrec_a (X0) = chrec_b (Y0)".  */
2672               HOST_WIDE_INT tau1 = MAX (CEIL (-i0, i1),
2673                                         CEIL (-j0, j1));
2674               HOST_WIDE_INT x0 = i1 * tau1 + i0;
2675               HOST_WIDE_INT y0 = j1 * tau1 + j0;
2676
2677               /* (X1, Y1) is the smallest positive solution of the eq
2678                  "chrec_a (X1) = chrec_b (Y1)", i.e. this is where the
2679                  first conflict occurs.  */
2680               HOST_WIDE_INT min_multiple = MIN (x0 / i1, y0 / j1);
2681               HOST_WIDE_INT x1 = x0 - i1 * min_multiple;
2682               HOST_WIDE_INT y1 = y0 - j1 * min_multiple;
2683
2684               if (niter > 0)
2685                 {
2686                   HOST_WIDE_INT tau2 = MIN (FLOOR_DIV (niter - i0, i1),
2687                                             FLOOR_DIV (niter - j0, j1));
2688                   HOST_WIDE_INT last_conflict = tau2 - (x1 - i0)/i1;
2689
2690                   /* If the overlap occurs outside of the bounds of the
2691                      loop, there is no dependence.  */
2692                   if (x1 >= niter || y1 >= niter)
2693                     {
2694                       *overlaps_a = conflict_fn_no_dependence ();
2695                       *overlaps_b = conflict_fn_no_dependence ();
2696                       *last_conflicts = integer_zero_node;
2697                       goto end_analyze_subs_aa;
2698                     }
2699                   else
2700                     *last_conflicts = build_int_cst (NULL_TREE, last_conflict);
2701                 }
2702               else
2703                 *last_conflicts = chrec_dont_know;
2704
2705               *overlaps_a
2706                 = conflict_fn (1,
2707                                affine_fn_univar (build_int_cst (NULL_TREE, x1),
2708                                                  1,
2709                                                  build_int_cst (NULL_TREE, i1)));
2710               *overlaps_b
2711                 = conflict_fn (1,
2712                                affine_fn_univar (build_int_cst (NULL_TREE, y1),
2713                                                  1,
2714                                                  build_int_cst (NULL_TREE, j1)));
2715             }
2716           else
2717             {
2718               /* FIXME: For the moment, the upper bound of the
2719                  iteration domain for i and j is not checked.  */
2720               if (dump_file && (dump_flags & TDF_DETAILS))
2721                 fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2722               *overlaps_a = conflict_fn_not_known ();
2723               *overlaps_b = conflict_fn_not_known ();
2724               *last_conflicts = chrec_dont_know;
2725             }
2726         }
2727       else
2728         {
2729           if (dump_file && (dump_flags & TDF_DETAILS))
2730             fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2731           *overlaps_a = conflict_fn_not_known ();
2732           *overlaps_b = conflict_fn_not_known ();
2733           *last_conflicts = chrec_dont_know;
2734         }
2735     }
2736   else
2737     {
2738       if (dump_file && (dump_flags & TDF_DETAILS))
2739         fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2740       *overlaps_a = conflict_fn_not_known ();
2741       *overlaps_b = conflict_fn_not_known ();
2742       *last_conflicts = chrec_dont_know;
2743     }
2744
2745 end_analyze_subs_aa:
2746   obstack_free (&scratch_obstack, NULL);
2747   if (dump_file && (dump_flags & TDF_DETAILS))
2748     {
2749       fprintf (dump_file, "  (overlaps_a = ");
2750       dump_conflict_function (dump_file, *overlaps_a);
2751       fprintf (dump_file, ")\n  (overlaps_b = ");
2752       dump_conflict_function (dump_file, *overlaps_b);
2753       fprintf (dump_file, "))\n");
2754     }
2755 }
2756
2757 /* Returns true when analyze_subscript_affine_affine can be used for
2758    determining the dependence relation between chrec_a and chrec_b,
2759    that contain symbols.  This function modifies chrec_a and chrec_b
2760    such that the analysis result is the same, and such that they don't
2761    contain symbols, and then can safely be passed to the analyzer.
2762
2763    Example: The analysis of the following tuples of evolutions produce
2764    the same results: {x+1, +, 1}_1 vs. {x+3, +, 1}_1, and {-2, +, 1}_1
2765    vs. {0, +, 1}_1
2766
2767    {x+1, +, 1}_1 ({2, +, 1}_1) = {x+3, +, 1}_1 ({0, +, 1}_1)
2768    {-2, +, 1}_1 ({2, +, 1}_1) = {0, +, 1}_1 ({0, +, 1}_1)
2769 */
2770
2771 static bool
2772 can_use_analyze_subscript_affine_affine (tree *chrec_a, tree *chrec_b)
2773 {
2774   tree diff, type, left_a, left_b, right_b;
2775
2776   if (chrec_contains_symbols (CHREC_RIGHT (*chrec_a))
2777       || chrec_contains_symbols (CHREC_RIGHT (*chrec_b)))
2778     /* FIXME: For the moment not handled.  Might be refined later.  */
2779     return false;
2780
2781   type = chrec_type (*chrec_a);
2782   left_a = CHREC_LEFT (*chrec_a);
2783   left_b = chrec_convert (type, CHREC_LEFT (*chrec_b), NULL);
2784   diff = chrec_fold_minus (type, left_a, left_b);
2785
2786   if (!evolution_function_is_constant_p (diff))
2787     return false;
2788
2789   if (dump_file && (dump_flags & TDF_DETAILS))
2790     fprintf (dump_file, "can_use_subscript_aff_aff_for_symbolic \n");
2791
2792   *chrec_a = build_polynomial_chrec (CHREC_VARIABLE (*chrec_a),
2793                                      diff, CHREC_RIGHT (*chrec_a));
2794   right_b = chrec_convert (type, CHREC_RIGHT (*chrec_b), NULL);
2795   *chrec_b = build_polynomial_chrec (CHREC_VARIABLE (*chrec_b),
2796                                      build_int_cst (type, 0),
2797                                      right_b);
2798   return true;
2799 }
2800
2801 /* Analyze a SIV (Single Index Variable) subscript.  *OVERLAPS_A and
2802    *OVERLAPS_B are initialized to the functions that describe the
2803    relation between the elements accessed twice by CHREC_A and
2804    CHREC_B.  For k >= 0, the following property is verified:
2805
2806    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
2807
2808 static void
2809 analyze_siv_subscript (tree chrec_a,
2810                        tree chrec_b,
2811                        conflict_function **overlaps_a,
2812                        conflict_function **overlaps_b,
2813                        tree *last_conflicts,
2814                        int loop_nest_num)
2815 {
2816   dependence_stats.num_siv++;
2817
2818   if (dump_file && (dump_flags & TDF_DETAILS))
2819     fprintf (dump_file, "(analyze_siv_subscript \n");
2820
2821   if (evolution_function_is_constant_p (chrec_a)
2822       && evolution_function_is_affine_in_loop (chrec_b, loop_nest_num))
2823     analyze_siv_subscript_cst_affine (chrec_a, chrec_b,
2824                                       overlaps_a, overlaps_b, last_conflicts);
2825
2826   else if (evolution_function_is_affine_in_loop (chrec_a, loop_nest_num)
2827            && evolution_function_is_constant_p (chrec_b))
2828     analyze_siv_subscript_cst_affine (chrec_b, chrec_a,
2829                                       overlaps_b, overlaps_a, last_conflicts);
2830
2831   else if (evolution_function_is_affine_in_loop (chrec_a, loop_nest_num)
2832            && evolution_function_is_affine_in_loop (chrec_b, loop_nest_num))
2833     {
2834       if (!chrec_contains_symbols (chrec_a)
2835           && !chrec_contains_symbols (chrec_b))
2836         {
2837           analyze_subscript_affine_affine (chrec_a, chrec_b,
2838                                            overlaps_a, overlaps_b,
2839                                            last_conflicts);
2840
2841           if (CF_NOT_KNOWN_P (*overlaps_a)
2842               || CF_NOT_KNOWN_P (*overlaps_b))
2843             dependence_stats.num_siv_unimplemented++;
2844           else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2845                    || CF_NO_DEPENDENCE_P (*overlaps_b))
2846             dependence_stats.num_siv_independent++;
2847           else
2848             dependence_stats.num_siv_dependent++;
2849         }
2850       else if (can_use_analyze_subscript_affine_affine (&chrec_a,
2851                                                         &chrec_b))
2852         {
2853           analyze_subscript_affine_affine (chrec_a, chrec_b,
2854                                            overlaps_a, overlaps_b,
2855                                            last_conflicts);
2856
2857           if (CF_NOT_KNOWN_P (*overlaps_a)
2858               || CF_NOT_KNOWN_P (*overlaps_b))
2859             dependence_stats.num_siv_unimplemented++;
2860           else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2861                    || CF_NO_DEPENDENCE_P (*overlaps_b))
2862             dependence_stats.num_siv_independent++;
2863           else
2864             dependence_stats.num_siv_dependent++;
2865         }
2866       else
2867         goto siv_subscript_dontknow;
2868     }
2869
2870   else
2871     {
2872     siv_subscript_dontknow:;
2873       if (dump_file && (dump_flags & TDF_DETAILS))
2874         fprintf (dump_file, "  siv test failed: unimplemented");
2875       *overlaps_a = conflict_fn_not_known ();
2876       *overlaps_b = conflict_fn_not_known ();
2877       *last_conflicts = chrec_dont_know;
2878       dependence_stats.num_siv_unimplemented++;
2879     }
2880
2881   if (dump_file && (dump_flags & TDF_DETAILS))
2882     fprintf (dump_file, ")\n");
2883 }
2884
2885 /* Returns false if we can prove that the greatest common divisor of the steps
2886    of CHREC does not divide CST, false otherwise.  */
2887
2888 static bool
2889 gcd_of_steps_may_divide_p (const_tree chrec, const_tree cst)
2890 {
2891   HOST_WIDE_INT cd = 0, val;
2892   tree step;
2893
2894   if (!tree_fits_shwi_p (cst))
2895     return true;
2896   val = tree_to_shwi (cst);
2897
2898   while (TREE_CODE (chrec) == POLYNOMIAL_CHREC)
2899     {
2900       step = CHREC_RIGHT (chrec);
2901       if (!tree_fits_shwi_p (step))
2902         return true;
2903       cd = gcd (cd, tree_to_shwi (step));
2904       chrec = CHREC_LEFT (chrec);
2905     }
2906
2907   return val % cd == 0;
2908 }
2909
2910 /* Analyze a MIV (Multiple Index Variable) subscript with respect to
2911    LOOP_NEST.  *OVERLAPS_A and *OVERLAPS_B are initialized to the
2912    functions that describe the relation between the elements accessed
2913    twice by CHREC_A and CHREC_B.  For k >= 0, the following property
2914    is verified:
2915
2916    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
2917
2918 static void
2919 analyze_miv_subscript (tree chrec_a,
2920                        tree chrec_b,
2921                        conflict_function **overlaps_a,
2922                        conflict_function **overlaps_b,
2923                        tree *last_conflicts,
2924                        struct loop *loop_nest)
2925 {
2926   tree type, difference;
2927
2928   dependence_stats.num_miv++;
2929   if (dump_file && (dump_flags & TDF_DETAILS))
2930     fprintf (dump_file, "(analyze_miv_subscript \n");
2931
2932   type = signed_type_for_types (TREE_TYPE (chrec_a), TREE_TYPE (chrec_b));
2933   chrec_a = chrec_convert (type, chrec_a, NULL);
2934   chrec_b = chrec_convert (type, chrec_b, NULL);
2935   difference = chrec_fold_minus (type, chrec_a, chrec_b);
2936
2937   if (eq_evolutions_p (chrec_a, chrec_b))
2938     {
2939       /* Access functions are the same: all the elements are accessed
2940          in the same order.  */
2941       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2942       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2943       *last_conflicts = max_stmt_executions_tree (get_chrec_loop (chrec_a));
2944       dependence_stats.num_miv_dependent++;
2945     }
2946
2947   else if (evolution_function_is_constant_p (difference)
2948            /* For the moment, the following is verified:
2949               evolution_function_is_affine_multivariate_p (chrec_a,
2950               loop_nest->num) */
2951            && !gcd_of_steps_may_divide_p (chrec_a, difference))
2952     {
2953       /* testsuite/.../ssa-chrec-33.c
2954          {{21, +, 2}_1, +, -2}_2  vs.  {{20, +, 2}_1, +, -2}_2
2955
2956          The difference is 1, and all the evolution steps are multiples
2957          of 2, consequently there are no overlapping elements.  */
2958       *overlaps_a = conflict_fn_no_dependence ();
2959       *overlaps_b = conflict_fn_no_dependence ();
2960       *last_conflicts = integer_zero_node;
2961       dependence_stats.num_miv_independent++;
2962     }
2963
2964   else if (evolution_function_is_affine_multivariate_p (chrec_a, loop_nest->num)
2965            && !chrec_contains_symbols (chrec_a)
2966            && evolution_function_is_affine_multivariate_p (chrec_b, loop_nest->num)
2967            && !chrec_contains_symbols (chrec_b))
2968     {
2969       /* testsuite/.../ssa-chrec-35.c
2970          {0, +, 1}_2  vs.  {0, +, 1}_3
2971          the overlapping elements are respectively located at iterations:
2972          {0, +, 1}_x and {0, +, 1}_x,
2973          in other words, we have the equality:
2974          {0, +, 1}_2 ({0, +, 1}_x) = {0, +, 1}_3 ({0, +, 1}_x)
2975
2976          Other examples:
2977          {{0, +, 1}_1, +, 2}_2 ({0, +, 1}_x, {0, +, 1}_y) =
2978          {0, +, 1}_1 ({{0, +, 1}_x, +, 2}_y)
2979
2980          {{0, +, 2}_1, +, 3}_2 ({0, +, 1}_y, {0, +, 1}_x) =
2981          {{0, +, 3}_1, +, 2}_2 ({0, +, 1}_x, {0, +, 1}_y)
2982       */
2983       analyze_subscript_affine_affine (chrec_a, chrec_b,
2984                                        overlaps_a, overlaps_b, last_conflicts);
2985
2986       if (CF_NOT_KNOWN_P (*overlaps_a)
2987           || CF_NOT_KNOWN_P (*overlaps_b))
2988         dependence_stats.num_miv_unimplemented++;
2989       else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2990                || CF_NO_DEPENDENCE_P (*overlaps_b))
2991         dependence_stats.num_miv_independent++;
2992       else
2993         dependence_stats.num_miv_dependent++;
2994     }
2995
2996   else
2997     {
2998       /* When the analysis is too difficult, answer "don't know".  */
2999       if (dump_file && (dump_flags & TDF_DETAILS))
3000         fprintf (dump_file, "analyze_miv_subscript test failed: unimplemented.\n");
3001
3002       *overlaps_a = conflict_fn_not_known ();
3003       *overlaps_b = conflict_fn_not_known ();
3004       *last_conflicts = chrec_dont_know;
3005       dependence_stats.num_miv_unimplemented++;
3006     }
3007
3008   if (dump_file && (dump_flags & TDF_DETAILS))
3009     fprintf (dump_file, ")\n");
3010 }
3011
3012 /* Determines the iterations for which CHREC_A is equal to CHREC_B in
3013    with respect to LOOP_NEST.  OVERLAP_ITERATIONS_A and
3014    OVERLAP_ITERATIONS_B are initialized with two functions that
3015    describe the iterations that contain conflicting elements.
3016
3017    Remark: For an integer k >= 0, the following equality is true:
3018
3019    CHREC_A (OVERLAP_ITERATIONS_A (k)) == CHREC_B (OVERLAP_ITERATIONS_B (k)).
3020 */
3021
3022 static void
3023 analyze_overlapping_iterations (tree chrec_a,
3024                                 tree chrec_b,
3025                                 conflict_function **overlap_iterations_a,
3026                                 conflict_function **overlap_iterations_b,
3027                                 tree *last_conflicts, struct loop *loop_nest)
3028 {
3029   unsigned int lnn = loop_nest->num;
3030
3031   dependence_stats.num_subscript_tests++;
3032
3033   if (dump_file && (dump_flags & TDF_DETAILS))
3034     {
3035       fprintf (dump_file, "(analyze_overlapping_iterations \n");
3036       fprintf (dump_file, "  (chrec_a = ");
3037       print_generic_expr (dump_file, chrec_a, 0);
3038       fprintf (dump_file, ")\n  (chrec_b = ");
3039       print_generic_expr (dump_file, chrec_b, 0);
3040       fprintf (dump_file, ")\n");
3041     }
3042
3043   if (chrec_a == NULL_TREE
3044       || chrec_b == NULL_TREE
3045       || chrec_contains_undetermined (chrec_a)
3046       || chrec_contains_undetermined (chrec_b))
3047     {
3048       dependence_stats.num_subscript_undetermined++;
3049
3050       *overlap_iterations_a = conflict_fn_not_known ();
3051       *overlap_iterations_b = conflict_fn_not_known ();
3052     }
3053
3054   /* If they are the same chrec, and are affine, they overlap
3055      on every iteration.  */
3056   else if (eq_evolutions_p (chrec_a, chrec_b)
3057            && (evolution_function_is_affine_multivariate_p (chrec_a, lnn)
3058                || operand_equal_p (chrec_a, chrec_b, 0)))
3059     {
3060       dependence_stats.num_same_subscript_function++;
3061       *overlap_iterations_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
3062       *overlap_iterations_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
3063       *last_conflicts = chrec_dont_know;
3064     }
3065
3066   /* If they aren't the same, and aren't affine, we can't do anything
3067      yet.  */
3068   else if ((chrec_contains_symbols (chrec_a)
3069             || chrec_contains_symbols (chrec_b))
3070            && (!evolution_function_is_affine_multivariate_p (chrec_a, lnn)
3071                || !evolution_function_is_affine_multivariate_p (chrec_b, lnn)))
3072     {
3073       dependence_stats.num_subscript_undetermined++;
3074       *overlap_iterations_a = conflict_fn_not_known ();
3075       *overlap_iterations_b = conflict_fn_not_known ();
3076     }
3077
3078   else if (ziv_subscript_p (chrec_a, chrec_b))
3079     analyze_ziv_subscript (chrec_a, chrec_b,
3080                            overlap_iterations_a, overlap_iterations_b,
3081                            last_conflicts);
3082
3083   else if (siv_subscript_p (chrec_a, chrec_b))
3084     analyze_siv_subscript (chrec_a, chrec_b,
3085                            overlap_iterations_a, overlap_iterations_b,
3086                            last_conflicts, lnn);
3087
3088   else
3089     analyze_miv_subscript (chrec_a, chrec_b,
3090                            overlap_iterations_a, overlap_iterations_b,
3091                            last_conflicts, loop_nest);
3092
3093   if (dump_file && (dump_flags & TDF_DETAILS))
3094     {
3095       fprintf (dump_file, "  (overlap_iterations_a = ");
3096       dump_conflict_function (dump_file, *overlap_iterations_a);
3097       fprintf (dump_file, ")\n  (overlap_iterations_b = ");
3098       dump_conflict_function (dump_file, *overlap_iterations_b);
3099       fprintf (dump_file, "))\n");
3100     }
3101 }
3102
3103 /* Helper function for uniquely inserting distance vectors.  */
3104
3105 static void
3106 save_dist_v (struct data_dependence_relation *ddr, lambda_vector dist_v)
3107 {
3108   unsigned i;
3109   lambda_vector v;
3110
3111   FOR_EACH_VEC_ELT (DDR_DIST_VECTS (ddr), i, v)
3112     if (lambda_vector_equal (v, dist_v, DDR_NB_LOOPS (ddr)))
3113       return;
3114
3115   DDR_DIST_VECTS (ddr).safe_push (dist_v);
3116 }
3117
3118 /* Helper function for uniquely inserting direction vectors.  */
3119
3120 static void
3121 save_dir_v (struct data_dependence_relation *ddr, lambda_vector dir_v)
3122 {
3123   unsigned i;
3124   lambda_vector v;
3125
3126   FOR_EACH_VEC_ELT (DDR_DIR_VECTS (ddr), i, v)
3127     if (lambda_vector_equal (v, dir_v, DDR_NB_LOOPS (ddr)))
3128       return;
3129
3130   DDR_DIR_VECTS (ddr).safe_push (dir_v);
3131 }
3132
3133 /* Add a distance of 1 on all the loops outer than INDEX.  If we
3134    haven't yet determined a distance for this outer loop, push a new
3135    distance vector composed of the previous distance, and a distance
3136    of 1 for this outer loop.  Example:
3137
3138    | loop_1
3139    |   loop_2
3140    |     A[10]
3141    |   endloop_2
3142    | endloop_1
3143
3144    Saved vectors are of the form (dist_in_1, dist_in_2).  First, we
3145    save (0, 1), then we have to save (1, 0).  */
3146
3147 static void
3148 add_outer_distances (struct data_dependence_relation *ddr,
3149                      lambda_vector dist_v, int index)
3150 {
3151   /* For each outer loop where init_v is not set, the accesses are
3152      in dependence of distance 1 in the loop.  */
3153   while (--index >= 0)
3154     {
3155       lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3156       lambda_vector_copy (dist_v, save_v, DDR_NB_LOOPS (ddr));
3157       save_v[index] = 1;
3158       save_dist_v (ddr, save_v);
3159     }
3160 }
3161
3162 /* Return false when fail to represent the data dependence as a
3163    distance vector.  INIT_B is set to true when a component has been
3164    added to the distance vector DIST_V.  INDEX_CARRY is then set to
3165    the index in DIST_V that carries the dependence.  */
3166
3167 static bool
3168 build_classic_dist_vector_1 (struct data_dependence_relation *ddr,
3169                              struct data_reference *ddr_a,
3170                              struct data_reference *ddr_b,
3171                              lambda_vector dist_v, bool *init_b,
3172                              int *index_carry)
3173 {
3174   unsigned i;
3175   lambda_vector init_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3176
3177   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3178     {
3179       tree access_fn_a, access_fn_b;
3180       struct subscript *subscript = DDR_SUBSCRIPT (ddr, i);
3181
3182       if (chrec_contains_undetermined (SUB_DISTANCE (subscript)))
3183         {
3184           non_affine_dependence_relation (ddr);
3185           return false;
3186         }
3187
3188       access_fn_a = DR_ACCESS_FN (ddr_a, i);
3189       access_fn_b = DR_ACCESS_FN (ddr_b, i);
3190
3191       if (TREE_CODE (access_fn_a) == POLYNOMIAL_CHREC
3192           && TREE_CODE (access_fn_b) == POLYNOMIAL_CHREC)
3193         {
3194           int dist, index;
3195           int var_a = CHREC_VARIABLE (access_fn_a);
3196           int var_b = CHREC_VARIABLE (access_fn_b);
3197
3198           if (var_a != var_b
3199               || chrec_contains_undetermined (SUB_DISTANCE (subscript)))
3200             {
3201               non_affine_dependence_relation (ddr);
3202               return false;
3203             }
3204
3205           dist = int_cst_value (SUB_DISTANCE (subscript));
3206           index = index_in_loop_nest (var_a, DDR_LOOP_NEST (ddr));
3207           *index_carry = MIN (index, *index_carry);
3208
3209           /* This is the subscript coupling test.  If we have already
3210              recorded a distance for this loop (a distance coming from
3211              another subscript), it should be the same.  For example,
3212              in the following code, there is no dependence:
3213
3214              | loop i = 0, N, 1
3215              |   T[i+1][i] = ...
3216              |   ... = T[i][i]
3217              | endloop
3218           */
3219           if (init_v[index] != 0 && dist_v[index] != dist)
3220             {
3221               finalize_ddr_dependent (ddr, chrec_known);
3222               return false;
3223             }
3224
3225           dist_v[index] = dist;
3226           init_v[index] = 1;
3227           *init_b = true;
3228         }
3229       else if (!operand_equal_p (access_fn_a, access_fn_b, 0))
3230         {
3231           /* This can be for example an affine vs. constant dependence
3232              (T[i] vs. T[3]) that is not an affine dependence and is
3233              not representable as a distance vector.  */
3234           non_affine_dependence_relation (ddr);
3235           return false;
3236         }
3237     }
3238
3239   return true;
3240 }
3241
3242 /* Return true when the DDR contains only constant access functions.  */
3243
3244 static bool
3245 constant_access_functions (const struct data_dependence_relation *ddr)
3246 {
3247   unsigned i;
3248
3249   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3250     if (!evolution_function_is_constant_p (DR_ACCESS_FN (DDR_A (ddr), i))
3251         || !evolution_function_is_constant_p (DR_ACCESS_FN (DDR_B (ddr), i)))
3252       return false;
3253
3254   return true;
3255 }
3256
3257 /* Helper function for the case where DDR_A and DDR_B are the same
3258    multivariate access function with a constant step.  For an example
3259    see pr34635-1.c.  */
3260
3261 static void
3262 add_multivariate_self_dist (struct data_dependence_relation *ddr, tree c_2)
3263 {
3264   int x_1, x_2;
3265   tree c_1 = CHREC_LEFT (c_2);
3266   tree c_0 = CHREC_LEFT (c_1);
3267   lambda_vector dist_v;
3268   int v1, v2, cd;
3269
3270   /* Polynomials with more than 2 variables are not handled yet.  When
3271      the evolution steps are parameters, it is not possible to
3272      represent the dependence using classical distance vectors.  */
3273   if (TREE_CODE (c_0) != INTEGER_CST
3274       || TREE_CODE (CHREC_RIGHT (c_1)) != INTEGER_CST
3275       || TREE_CODE (CHREC_RIGHT (c_2)) != INTEGER_CST)
3276     {
3277       DDR_AFFINE_P (ddr) = false;
3278       return;
3279     }
3280
3281   x_2 = index_in_loop_nest (CHREC_VARIABLE (c_2), DDR_LOOP_NEST (ddr));
3282   x_1 = index_in_loop_nest (CHREC_VARIABLE (c_1), DDR_LOOP_NEST (ddr));
3283
3284   /* For "{{0, +, 2}_1, +, 3}_2" the distance vector is (3, -2).  */
3285   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3286   v1 = int_cst_value (CHREC_RIGHT (c_1));
3287   v2 = int_cst_value (CHREC_RIGHT (c_2));
3288   cd = gcd (v1, v2);
3289   v1 /= cd;
3290   v2 /= cd;
3291
3292   if (v2 < 0)
3293     {
3294       v2 = -v2;
3295       v1 = -v1;
3296     }
3297
3298   dist_v[x_1] = v2;
3299   dist_v[x_2] = -v1;
3300   save_dist_v (ddr, dist_v);
3301
3302   add_outer_distances (ddr, dist_v, x_1);
3303 }
3304
3305 /* Helper function for the case where DDR_A and DDR_B are the same
3306    access functions.  */
3307
3308 static void
3309 add_other_self_distances (struct data_dependence_relation *ddr)
3310 {
3311   lambda_vector dist_v;
3312   unsigned i;
3313   int index_carry = DDR_NB_LOOPS (ddr);
3314
3315   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3316     {
3317       tree access_fun = DR_ACCESS_FN (DDR_A (ddr), i);
3318
3319       if (TREE_CODE (access_fun) == POLYNOMIAL_CHREC)
3320         {
3321           if (!evolution_function_is_univariate_p (access_fun))
3322             {
3323               if (DDR_NUM_SUBSCRIPTS (ddr) != 1)
3324                 {
3325                   DDR_ARE_DEPENDENT (ddr) = chrec_dont_know;
3326                   return;
3327                 }
3328
3329               access_fun = DR_ACCESS_FN (DDR_A (ddr), 0);
3330
3331               if (TREE_CODE (CHREC_LEFT (access_fun)) == POLYNOMIAL_CHREC)
3332                 add_multivariate_self_dist (ddr, access_fun);
3333               else
3334                 /* The evolution step is not constant: it varies in
3335                    the outer loop, so this cannot be represented by a
3336                    distance vector.  For example in pr34635.c the
3337                    evolution is {0, +, {0, +, 4}_1}_2.  */
3338                 DDR_AFFINE_P (ddr) = false;
3339
3340               return;
3341             }
3342
3343           index_carry = MIN (index_carry,
3344                              index_in_loop_nest (CHREC_VARIABLE (access_fun),
3345                                                  DDR_LOOP_NEST (ddr)));
3346         }
3347     }
3348
3349   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3350   add_outer_distances (ddr, dist_v, index_carry);
3351 }
3352
3353 static void
3354 insert_innermost_unit_dist_vector (struct data_dependence_relation *ddr)
3355 {
3356   lambda_vector dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3357
3358   dist_v[DDR_INNER_LOOP (ddr)] = 1;
3359   save_dist_v (ddr, dist_v);
3360 }
3361
3362 /* Adds a unit distance vector to DDR when there is a 0 overlap.  This
3363    is the case for example when access functions are the same and
3364    equal to a constant, as in:
3365
3366    | loop_1
3367    |   A[3] = ...
3368    |   ... = A[3]
3369    | endloop_1
3370
3371    in which case the distance vectors are (0) and (1).  */
3372
3373 static void
3374 add_distance_for_zero_overlaps (struct data_dependence_relation *ddr)
3375 {
3376   unsigned i, j;
3377
3378   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3379     {
3380       subscript_p sub = DDR_SUBSCRIPT (ddr, i);
3381       conflict_function *ca = SUB_CONFLICTS_IN_A (sub);
3382       conflict_function *cb = SUB_CONFLICTS_IN_B (sub);
3383
3384       for (j = 0; j < ca->n; j++)
3385         if (affine_function_zero_p (ca->fns[j]))
3386           {
3387             insert_innermost_unit_dist_vector (ddr);
3388             return;
3389           }
3390
3391       for (j = 0; j < cb->n; j++)
3392         if (affine_function_zero_p (cb->fns[j]))
3393           {
3394             insert_innermost_unit_dist_vector (ddr);
3395             return;
3396           }
3397     }
3398 }
3399
3400 /* Compute the classic per loop distance vector.  DDR is the data
3401    dependence relation to build a vector from.  Return false when fail
3402    to represent the data dependence as a distance vector.  */
3403
3404 static bool
3405 build_classic_dist_vector (struct data_dependence_relation *ddr,
3406                            struct loop *loop_nest)
3407 {
3408   bool init_b = false;
3409   int index_carry = DDR_NB_LOOPS (ddr);
3410   lambda_vector dist_v;
3411
3412   if (DDR_ARE_DEPENDENT (ddr) != NULL_TREE)
3413     return false;
3414
3415   if (same_access_functions (ddr))
3416     {
3417       /* Save the 0 vector.  */
3418       dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3419       save_dist_v (ddr, dist_v);
3420
3421       if (constant_access_functions (ddr))
3422         add_distance_for_zero_overlaps (ddr);
3423
3424       if (DDR_NB_LOOPS (ddr) > 1)
3425         add_other_self_distances (ddr);
3426
3427       return true;
3428     }
3429
3430   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3431   if (!build_classic_dist_vector_1 (ddr, DDR_A (ddr), DDR_B (ddr),
3432                                     dist_v, &init_b, &index_carry))
3433     return false;
3434
3435   /* Save the distance vector if we initialized one.  */
3436   if (init_b)
3437     {
3438       /* Verify a basic constraint: classic distance vectors should
3439          always be lexicographically positive.
3440
3441          Data references are collected in the order of execution of
3442          the program, thus for the following loop
3443
3444          | for (i = 1; i < 100; i++)
3445          |   for (j = 1; j < 100; j++)
3446          |     {
3447          |       t = T[j+1][i-1];  // A
3448          |       T[j][i] = t + 2;  // B
3449          |     }
3450
3451          references are collected following the direction of the wind:
3452          A then B.  The data dependence tests are performed also
3453          following this order, such that we're looking at the distance
3454          separating the elements accessed by A from the elements later
3455          accessed by B.  But in this example, the distance returned by
3456          test_dep (A, B) is lexicographically negative (-1, 1), that
3457          means that the access A occurs later than B with respect to
3458          the outer loop, ie. we're actually looking upwind.  In this
3459          case we solve test_dep (B, A) looking downwind to the
3460          lexicographically positive solution, that returns the
3461          distance vector (1, -1).  */
3462       if (!lambda_vector_lexico_pos (dist_v, DDR_NB_LOOPS (ddr)))
3463         {
3464           lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3465           if (!subscript_dependence_tester_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3466                                               loop_nest))
3467             return false;
3468           compute_subscript_distance (ddr);
3469           if (!build_classic_dist_vector_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3470                                             save_v, &init_b, &index_carry))
3471             return false;
3472           save_dist_v (ddr, save_v);
3473           DDR_REVERSED_P (ddr) = true;
3474
3475           /* In this case there is a dependence forward for all the
3476              outer loops:
3477
3478              | for (k = 1; k < 100; k++)
3479              |  for (i = 1; i < 100; i++)
3480              |   for (j = 1; j < 100; j++)
3481              |     {
3482              |       t = T[j+1][i-1];  // A
3483              |       T[j][i] = t + 2;  // B
3484              |     }
3485
3486              the vectors are:
3487              (0,  1, -1)
3488              (1,  1, -1)
3489              (1, -1,  1)
3490           */
3491           if (DDR_NB_LOOPS (ddr) > 1)
3492             {
3493               add_outer_distances (ddr, save_v, index_carry);
3494               add_outer_distances (ddr, dist_v, index_carry);
3495             }
3496         }
3497       else
3498         {
3499           lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3500           lambda_vector_copy (dist_v, save_v, DDR_NB_LOOPS (ddr));
3501
3502           if (DDR_NB_LOOPS (ddr) > 1)
3503             {
3504               lambda_vector opposite_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3505
3506               if (!subscript_dependence_tester_1 (ddr, DDR_B (ddr),
3507                                                   DDR_A (ddr), loop_nest))
3508                 return false;
3509               compute_subscript_distance (ddr);
3510               if (!build_classic_dist_vector_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3511                                                 opposite_v, &init_b,
3512                                                 &index_carry))
3513                 return false;
3514
3515               save_dist_v (ddr, save_v);
3516               add_outer_distances (ddr, dist_v, index_carry);
3517               add_outer_distances (ddr, opposite_v, index_carry);
3518             }
3519           else
3520             save_dist_v (ddr, save_v);
3521         }
3522     }
3523   else
3524     {
3525       /* There is a distance of 1 on all the outer loops: Example:
3526          there is a dependence of distance 1 on loop_1 for the array A.
3527
3528          | loop_1
3529          |   A[5] = ...
3530          | endloop
3531       */
3532       add_outer_distances (ddr, dist_v,
3533                            lambda_vector_first_nz (dist_v,
3534                                                    DDR_NB_LOOPS (ddr), 0));
3535     }
3536
3537   if (dump_file && (dump_flags & TDF_DETAILS))
3538     {
3539       unsigned i;
3540
3541       fprintf (dump_file, "(build_classic_dist_vector\n");
3542       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
3543         {
3544           fprintf (dump_file, "  dist_vector = (");
3545           print_lambda_vector (dump_file, DDR_DIST_VECT (ddr, i),
3546                                DDR_NB_LOOPS (ddr));
3547           fprintf (dump_file, "  )\n");
3548         }
3549       fprintf (dump_file, ")\n");
3550     }
3551
3552   return true;
3553 }
3554
3555 /* Return the direction for a given distance.
3556    FIXME: Computing dir this way is suboptimal, since dir can catch
3557    cases that dist is unable to represent.  */
3558
3559 static inline enum data_dependence_direction
3560 dir_from_dist (int dist)
3561 {
3562   if (dist > 0)
3563     return dir_positive;
3564   else if (dist < 0)
3565     return dir_negative;
3566   else
3567     return dir_equal;
3568 }
3569
3570 /* Compute the classic per loop direction vector.  DDR is the data
3571    dependence relation to build a vector from.  */
3572
3573 static void
3574 build_classic_dir_vector (struct data_dependence_relation *ddr)
3575 {
3576   unsigned i, j;
3577   lambda_vector dist_v;
3578
3579   FOR_EACH_VEC_ELT (DDR_DIST_VECTS (ddr), i, dist_v)
3580     {
3581       lambda_vector dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3582
3583       for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
3584         dir_v[j] = dir_from_dist (dist_v[j]);
3585
3586       save_dir_v (ddr, dir_v);
3587     }
3588 }
3589
3590 /* Helper function.  Returns true when there is a dependence between
3591    data references DRA and DRB.  */
3592
3593 static bool
3594 subscript_dependence_tester_1 (struct data_dependence_relation *ddr,
3595                                struct data_reference *dra,
3596                                struct data_reference *drb,
3597                                struct loop *loop_nest)
3598 {
3599   unsigned int i;
3600   tree last_conflicts;
3601   struct subscript *subscript;
3602   tree res = NULL_TREE;
3603
3604   for (i = 0; DDR_SUBSCRIPTS (ddr).iterate (i, &subscript); i++)
3605     {
3606       conflict_function *overlaps_a, *overlaps_b;
3607
3608       analyze_overlapping_iterations (DR_ACCESS_FN (dra, i),
3609                                       DR_ACCESS_FN (drb, i),
3610                                       &overlaps_a, &overlaps_b,
3611                                       &last_conflicts, loop_nest);
3612
3613       if (SUB_CONFLICTS_IN_A (subscript))
3614         free_conflict_function (SUB_CONFLICTS_IN_A (subscript));
3615       if (SUB_CONFLICTS_IN_B (subscript))
3616         free_conflict_function (SUB_CONFLICTS_IN_B (subscript));
3617
3618       SUB_CONFLICTS_IN_A (subscript) = overlaps_a;
3619       SUB_CONFLICTS_IN_B (subscript) = overlaps_b;
3620       SUB_LAST_CONFLICT (subscript) = last_conflicts;
3621
3622       /* If there is any undetermined conflict function we have to
3623          give a conservative answer in case we cannot prove that
3624          no dependence exists when analyzing another subscript.  */
3625       if (CF_NOT_KNOWN_P (overlaps_a)
3626           || CF_NOT_KNOWN_P (overlaps_b))
3627         {
3628           res = chrec_dont_know;
3629           continue;
3630         }
3631
3632       /* When there is a subscript with no dependence we can stop.  */
3633       else if (CF_NO_DEPENDENCE_P (overlaps_a)
3634                || CF_NO_DEPENDENCE_P (overlaps_b))
3635         {
3636           res = chrec_known;
3637           break;
3638         }
3639     }
3640
3641   if (res == NULL_TREE)
3642     return true;
3643
3644   if (res == chrec_known)
3645     dependence_stats.num_dependence_independent++;
3646   else
3647     dependence_stats.num_dependence_undetermined++;
3648   finalize_ddr_dependent (ddr, res);
3649   return false;
3650 }
3651
3652 /* Computes the conflicting iterations in LOOP_NEST, and initialize DDR.  */
3653
3654 static void
3655 subscript_dependence_tester (struct data_dependence_relation *ddr,
3656                              struct loop *loop_nest)
3657 {
3658   if (subscript_dependence_tester_1 (ddr, DDR_A (ddr), DDR_B (ddr), loop_nest))
3659     dependence_stats.num_dependence_dependent++;
3660
3661   compute_subscript_distance (ddr);
3662   if (build_classic_dist_vector (ddr, loop_nest))
3663     build_classic_dir_vector (ddr);
3664 }
3665
3666 /* Returns true when all the access functions of A are affine or
3667    constant with respect to LOOP_NEST.  */
3668
3669 static bool
3670 access_functions_are_affine_or_constant_p (const struct data_reference *a,
3671                                            const struct loop *loop_nest)
3672 {
3673   unsigned int i;
3674   vec<tree> fns = DR_ACCESS_FNS (a);
3675   tree t;
3676
3677   FOR_EACH_VEC_ELT (fns, i, t)
3678     if (!evolution_function_is_invariant_p (t, loop_nest->num)
3679         && !evolution_function_is_affine_multivariate_p (t, loop_nest->num))
3680       return false;
3681
3682   return true;
3683 }
3684
3685 /* This computes the affine dependence relation between A and B with
3686    respect to LOOP_NEST.  CHREC_KNOWN is used for representing the
3687    independence between two accesses, while CHREC_DONT_KNOW is used
3688    for representing the unknown relation.
3689
3690    Note that it is possible to stop the computation of the dependence
3691    relation the first time we detect a CHREC_KNOWN element for a given
3692    subscript.  */
3693
3694 void
3695 compute_affine_dependence (struct data_dependence_relation *ddr,
3696                            struct loop *loop_nest)
3697 {
3698   struct data_reference *dra = DDR_A (ddr);
3699   struct data_reference *drb = DDR_B (ddr);
3700
3701   if (dump_file && (dump_flags & TDF_DETAILS))
3702     {
3703       fprintf (dump_file, "(compute_affine_dependence\n");
3704       fprintf (dump_file, "  stmt_a: ");
3705       print_gimple_stmt (dump_file, DR_STMT (dra), 0, TDF_SLIM);
3706       fprintf (dump_file, "  stmt_b: ");
3707       print_gimple_stmt (dump_file, DR_STMT (drb), 0, TDF_SLIM);
3708     }
3709
3710   /* Analyze only when the dependence relation is not yet known.  */
3711   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
3712     {
3713       dependence_stats.num_dependence_tests++;
3714
3715       if (access_functions_are_affine_or_constant_p (dra, loop_nest)
3716           && access_functions_are_affine_or_constant_p (drb, loop_nest))
3717         subscript_dependence_tester (ddr, loop_nest);
3718
3719       /* As a last case, if the dependence cannot be determined, or if
3720          the dependence is considered too difficult to determine, answer
3721          "don't know".  */
3722       else
3723         {
3724           dependence_stats.num_dependence_undetermined++;
3725
3726           if (dump_file && (dump_flags & TDF_DETAILS))
3727             {
3728               fprintf (dump_file, "Data ref a:\n");
3729               dump_data_reference (dump_file, dra);
3730               fprintf (dump_file, "Data ref b:\n");
3731               dump_data_reference (dump_file, drb);
3732               fprintf (dump_file, "affine dependence test not usable: access function not affine or constant.\n");
3733             }
3734           finalize_ddr_dependent (ddr, chrec_dont_know);
3735         }
3736     }
3737
3738   if (dump_file && (dump_flags & TDF_DETAILS))
3739     {
3740       if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
3741         fprintf (dump_file, ") -> no dependence\n");
3742       else if (DDR_ARE_DEPENDENT (ddr) == chrec_dont_know)
3743         fprintf (dump_file, ") -> dependence analysis failed\n");
3744       else
3745         fprintf (dump_file, ")\n");
3746     }
3747 }
3748
3749 /* Compute in DEPENDENCE_RELATIONS the data dependence graph for all
3750    the data references in DATAREFS, in the LOOP_NEST.  When
3751    COMPUTE_SELF_AND_RR is FALSE, don't compute read-read and self
3752    relations.  Return true when successful, i.e. data references number
3753    is small enough to be handled.  */
3754
3755 bool
3756 compute_all_dependences (vec<data_reference_p> datarefs,
3757                          vec<ddr_p> *dependence_relations,
3758                          vec<loop_p> loop_nest,
3759                          bool compute_self_and_rr)
3760 {
3761   struct data_dependence_relation *ddr;
3762   struct data_reference *a, *b;
3763   unsigned int i, j;
3764
3765   if ((int) datarefs.length ()
3766       > PARAM_VALUE (PARAM_LOOP_MAX_DATAREFS_FOR_DATADEPS))
3767     {
3768       struct data_dependence_relation *ddr;
3769
3770       /* Insert a single relation into dependence_relations:
3771          chrec_dont_know.  */
3772       ddr = initialize_data_dependence_relation (NULL, NULL, loop_nest);
3773       dependence_relations->safe_push (ddr);
3774       return false;
3775     }
3776
3777   FOR_EACH_VEC_ELT (datarefs, i, a)
3778     for (j = i + 1; datarefs.iterate (j, &b); j++)
3779       if (DR_IS_WRITE (a) || DR_IS_WRITE (b) || compute_self_and_rr)
3780         {
3781           ddr = initialize_data_dependence_relation (a, b, loop_nest);
3782           dependence_relations->safe_push (ddr);
3783           if (loop_nest.exists ())
3784             compute_affine_dependence (ddr, loop_nest[0]);
3785         }
3786
3787   if (compute_self_and_rr)
3788     FOR_EACH_VEC_ELT (datarefs, i, a)
3789       {
3790         ddr = initialize_data_dependence_relation (a, a, loop_nest);
3791         dependence_relations->safe_push (ddr);
3792         if (loop_nest.exists ())
3793           compute_affine_dependence (ddr, loop_nest[0]);
3794       }
3795
3796   return true;
3797 }
3798
3799 /* Describes a location of a memory reference.  */
3800
3801 struct data_ref_loc
3802 {
3803   /* The memory reference.  */
3804   tree ref;
3805
3806   /* True if the memory reference is read.  */
3807   bool is_read;
3808 };
3809
3810
3811 /* Stores the locations of memory references in STMT to REFERENCES.  Returns
3812    true if STMT clobbers memory, false otherwise.  */
3813
3814 static bool
3815 get_references_in_stmt (gimple stmt, vec<data_ref_loc, va_heap> *references)
3816 {
3817   bool clobbers_memory = false;
3818   data_ref_loc ref;
3819   tree op0, op1;
3820   enum gimple_code stmt_code = gimple_code (stmt);
3821
3822   /* ASM_EXPR and CALL_EXPR may embed arbitrary side effects.
3823      As we cannot model data-references to not spelled out
3824      accesses give up if they may occur.  */
3825   if (stmt_code == GIMPLE_CALL
3826       && !(gimple_call_flags (stmt) & ECF_CONST))
3827     {
3828       /* Allow IFN_GOMP_SIMD_LANE in their own loops.  */
3829       if (gimple_call_internal_p (stmt))
3830         switch (gimple_call_internal_fn (stmt))
3831           {
3832           case IFN_GOMP_SIMD_LANE:
3833             {
3834               struct loop *loop = gimple_bb (stmt)->loop_father;
3835               tree uid = gimple_call_arg (stmt, 0);
3836               gcc_assert (TREE_CODE (uid) == SSA_NAME);
3837               if (loop == NULL
3838                   || loop->simduid != SSA_NAME_VAR (uid))
3839                 clobbers_memory = true;
3840               break;
3841             }
3842           case IFN_MASK_LOAD:
3843           case IFN_MASK_STORE:
3844             break;
3845           default:
3846             clobbers_memory = true;
3847             break;
3848           }
3849       else
3850         clobbers_memory = true;
3851     }
3852   else if (stmt_code == GIMPLE_ASM
3853            && (gimple_asm_volatile_p (as_a <gasm *> (stmt))
3854                || gimple_vuse (stmt)))
3855     clobbers_memory = true;
3856
3857   if (!gimple_vuse (stmt))
3858     return clobbers_memory;
3859
3860   if (stmt_code == GIMPLE_ASSIGN)
3861     {
3862       tree base;
3863       op0 = gimple_assign_lhs (stmt);
3864       op1 = gimple_assign_rhs1 (stmt);
3865
3866       if (DECL_P (op1)
3867           || (REFERENCE_CLASS_P (op1)
3868               && (base = get_base_address (op1))
3869               && TREE_CODE (base) != SSA_NAME))
3870         {
3871           ref.ref = op1;
3872           ref.is_read = true;
3873           references->safe_push (ref);
3874         }
3875     }
3876   else if (stmt_code == GIMPLE_CALL)
3877     {
3878       unsigned i, n;
3879
3880       ref.is_read = false;
3881       if (gimple_call_internal_p (stmt))
3882         switch (gimple_call_internal_fn (stmt))
3883           {
3884           case IFN_MASK_LOAD:
3885             if (gimple_call_lhs (stmt) == NULL_TREE)
3886               break;
3887             ref.is_read = true;
3888           case IFN_MASK_STORE:
3889             ref.ref = fold_build2 (MEM_REF,
3890                                    ref.is_read
3891                                    ? TREE_TYPE (gimple_call_lhs (stmt))
3892                                    : TREE_TYPE (gimple_call_arg (stmt, 3)),
3893                                    gimple_call_arg (stmt, 0),
3894                                    gimple_call_arg (stmt, 1));
3895             references->safe_push (ref);
3896             return false;
3897           default:
3898             break;
3899           }
3900
3901       op0 = gimple_call_lhs (stmt);
3902       n = gimple_call_num_args (stmt);
3903       for (i = 0; i < n; i++)
3904         {
3905           op1 = gimple_call_arg (stmt, i);
3906
3907           if (DECL_P (op1)
3908               || (REFERENCE_CLASS_P (op1) && get_base_address (op1)))
3909             {
3910               ref.ref = op1;
3911               ref.is_read = true;
3912               references->safe_push (ref);
3913             }
3914         }
3915     }
3916   else
3917     return clobbers_memory;
3918
3919   if (op0
3920       && (DECL_P (op0)
3921           || (REFERENCE_CLASS_P (op0) && get_base_address (op0))))
3922     {
3923       ref.ref = op0;
3924       ref.is_read = false;
3925       references->safe_push (ref);
3926     }
3927   return clobbers_memory;
3928 }
3929
3930 /* Stores the data references in STMT to DATAREFS.  If there is an unanalyzable
3931    reference, returns false, otherwise returns true.  NEST is the outermost
3932    loop of the loop nest in which the references should be analyzed.  */
3933
3934 bool
3935 find_data_references_in_stmt (struct loop *nest, gimple stmt,
3936                               vec<data_reference_p> *datarefs)
3937 {
3938   unsigned i;
3939   auto_vec<data_ref_loc, 2> references;
3940   data_ref_loc *ref;
3941   bool ret = true;
3942   data_reference_p dr;
3943
3944   if (get_references_in_stmt (stmt, &references))
3945     return false;
3946
3947   FOR_EACH_VEC_ELT (references, i, ref)
3948     {
3949       dr = create_data_ref (nest, loop_containing_stmt (stmt),
3950                             ref->ref, stmt, ref->is_read);
3951       gcc_assert (dr != NULL);
3952       datarefs->safe_push (dr);
3953     }
3954   references.release ();
3955   return ret;
3956 }
3957
3958 /* Stores the data references in STMT to DATAREFS.  If there is an
3959    unanalyzable reference, returns false, otherwise returns true.
3960    NEST is the outermost loop of the loop nest in which the references
3961    should be instantiated, LOOP is the loop in which the references
3962    should be analyzed.  */
3963
3964 bool
3965 graphite_find_data_references_in_stmt (loop_p nest, loop_p loop, gimple stmt,
3966                                        vec<data_reference_p> *datarefs)
3967 {
3968   unsigned i;
3969   auto_vec<data_ref_loc, 2> references;
3970   data_ref_loc *ref;
3971   bool ret = true;
3972   data_reference_p dr;
3973
3974   if (get_references_in_stmt (stmt, &references))
3975     return false;
3976
3977   FOR_EACH_VEC_ELT (references, i, ref)
3978     {
3979       dr = create_data_ref (nest, loop, ref->ref, stmt, ref->is_read);
3980       gcc_assert (dr != NULL);
3981       datarefs->safe_push (dr);
3982     }
3983
3984   references.release ();
3985   return ret;
3986 }
3987
3988 /* Search the data references in LOOP, and record the information into
3989    DATAREFS.  Returns chrec_dont_know when failing to analyze a
3990    difficult case, returns NULL_TREE otherwise.  */
3991
3992 tree
3993 find_data_references_in_bb (struct loop *loop, basic_block bb,
3994                             vec<data_reference_p> *datarefs)
3995 {
3996   gimple_stmt_iterator bsi;
3997
3998   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
3999     {
4000       gimple stmt = gsi_stmt (bsi);
4001
4002       if (!find_data_references_in_stmt (loop, stmt, datarefs))
4003         {
4004           struct data_reference *res;
4005           res = XCNEW (struct data_reference);
4006           datarefs->safe_push (res);
4007
4008           return chrec_dont_know;
4009         }
4010     }
4011
4012   return NULL_TREE;
4013 }
4014
4015 /* Search the data references in LOOP, and record the information into
4016    DATAREFS.  Returns chrec_dont_know when failing to analyze a
4017    difficult case, returns NULL_TREE otherwise.
4018
4019    TODO: This function should be made smarter so that it can handle address
4020    arithmetic as if they were array accesses, etc.  */
4021
4022 tree
4023 find_data_references_in_loop (struct loop *loop,
4024                               vec<data_reference_p> *datarefs)
4025 {
4026   basic_block bb, *bbs;
4027   unsigned int i;
4028
4029   bbs = get_loop_body_in_dom_order (loop);
4030
4031   for (i = 0; i < loop->num_nodes; i++)
4032     {
4033       bb = bbs[i];
4034
4035       if (find_data_references_in_bb (loop, bb, datarefs) == chrec_dont_know)
4036         {
4037           free (bbs);
4038           return chrec_dont_know;
4039         }
4040     }
4041   free (bbs);
4042
4043   return NULL_TREE;
4044 }
4045
4046 /* Recursive helper function.  */
4047
4048 static bool
4049 find_loop_nest_1 (struct loop *loop, vec<loop_p> *loop_nest)
4050 {
4051   /* Inner loops of the nest should not contain siblings.  Example:
4052      when there are two consecutive loops,
4053
4054      | loop_0
4055      |   loop_1
4056      |     A[{0, +, 1}_1]
4057      |   endloop_1
4058      |   loop_2
4059      |     A[{0, +, 1}_2]
4060      |   endloop_2
4061      | endloop_0
4062
4063      the dependence relation cannot be captured by the distance
4064      abstraction.  */
4065   if (loop->next)
4066     return false;
4067
4068   loop_nest->safe_push (loop);
4069   if (loop->inner)
4070     return find_loop_nest_1 (loop->inner, loop_nest);
4071   return true;
4072 }
4073
4074 /* Return false when the LOOP is not well nested.  Otherwise return
4075    true and insert in LOOP_NEST the loops of the nest.  LOOP_NEST will
4076    contain the loops from the outermost to the innermost, as they will
4077    appear in the classic distance vector.  */
4078
4079 bool
4080 find_loop_nest (struct loop *loop, vec<loop_p> *loop_nest)
4081 {
4082   loop_nest->safe_push (loop);
4083   if (loop->inner)
4084     return find_loop_nest_1 (loop->inner, loop_nest);
4085   return true;
4086 }
4087
4088 /* Returns true when the data dependences have been computed, false otherwise.
4089    Given a loop nest LOOP, the following vectors are returned:
4090    DATAREFS is initialized to all the array elements contained in this loop,
4091    DEPENDENCE_RELATIONS contains the relations between the data references.
4092    Compute read-read and self relations if
4093    COMPUTE_SELF_AND_READ_READ_DEPENDENCES is TRUE.  */
4094
4095 bool
4096 compute_data_dependences_for_loop (struct loop *loop,
4097                                    bool compute_self_and_read_read_dependences,
4098                                    vec<loop_p> *loop_nest,
4099                                    vec<data_reference_p> *datarefs,
4100                                    vec<ddr_p> *dependence_relations)
4101 {
4102   bool res = true;
4103
4104   memset (&dependence_stats, 0, sizeof (dependence_stats));
4105
4106   /* If the loop nest is not well formed, or one of the data references
4107      is not computable, give up without spending time to compute other
4108      dependences.  */
4109   if (!loop
4110       || !find_loop_nest (loop, loop_nest)
4111       || find_data_references_in_loop (loop, datarefs) == chrec_dont_know
4112       || !compute_all_dependences (*datarefs, dependence_relations, *loop_nest,
4113                                    compute_self_and_read_read_dependences))
4114     res = false;
4115
4116   if (dump_file && (dump_flags & TDF_STATS))
4117     {
4118       fprintf (dump_file, "Dependence tester statistics:\n");
4119
4120       fprintf (dump_file, "Number of dependence tests: %d\n",
4121                dependence_stats.num_dependence_tests);
4122       fprintf (dump_file, "Number of dependence tests classified dependent: %d\n",
4123                dependence_stats.num_dependence_dependent);
4124       fprintf (dump_file, "Number of dependence tests classified independent: %d\n",
4125                dependence_stats.num_dependence_independent);
4126       fprintf (dump_file, "Number of undetermined dependence tests: %d\n",
4127                dependence_stats.num_dependence_undetermined);
4128
4129       fprintf (dump_file, "Number of subscript tests: %d\n",
4130                dependence_stats.num_subscript_tests);
4131       fprintf (dump_file, "Number of undetermined subscript tests: %d\n",
4132                dependence_stats.num_subscript_undetermined);
4133       fprintf (dump_file, "Number of same subscript function: %d\n",
4134                dependence_stats.num_same_subscript_function);
4135
4136       fprintf (dump_file, "Number of ziv tests: %d\n",
4137                dependence_stats.num_ziv);
4138       fprintf (dump_file, "Number of ziv tests returning dependent: %d\n",
4139                dependence_stats.num_ziv_dependent);
4140       fprintf (dump_file, "Number of ziv tests returning independent: %d\n",
4141                dependence_stats.num_ziv_independent);
4142       fprintf (dump_file, "Number of ziv tests unimplemented: %d\n",
4143                dependence_stats.num_ziv_unimplemented);
4144
4145       fprintf (dump_file, "Number of siv tests: %d\n",
4146                dependence_stats.num_siv);
4147       fprintf (dump_file, "Number of siv tests returning dependent: %d\n",
4148                dependence_stats.num_siv_dependent);
4149       fprintf (dump_file, "Number of siv tests returning independent: %d\n",
4150                dependence_stats.num_siv_independent);
4151       fprintf (dump_file, "Number of siv tests unimplemented: %d\n",
4152                dependence_stats.num_siv_unimplemented);
4153
4154       fprintf (dump_file, "Number of miv tests: %d\n",
4155                dependence_stats.num_miv);
4156       fprintf (dump_file, "Number of miv tests returning dependent: %d\n",
4157                dependence_stats.num_miv_dependent);
4158       fprintf (dump_file, "Number of miv tests returning independent: %d\n",
4159                dependence_stats.num_miv_independent);
4160       fprintf (dump_file, "Number of miv tests unimplemented: %d\n",
4161                dependence_stats.num_miv_unimplemented);
4162     }
4163
4164   return res;
4165 }
4166
4167 /* Free the memory used by a data dependence relation DDR.  */
4168
4169 void
4170 free_dependence_relation (struct data_dependence_relation *ddr)
4171 {
4172   if (ddr == NULL)
4173     return;
4174
4175   if (DDR_SUBSCRIPTS (ddr).exists ())
4176     free_subscripts (DDR_SUBSCRIPTS (ddr));
4177   DDR_DIST_VECTS (ddr).release ();
4178   DDR_DIR_VECTS (ddr).release ();
4179
4180   free (ddr);
4181 }
4182
4183 /* Free the memory used by the data dependence relations from
4184    DEPENDENCE_RELATIONS.  */
4185
4186 void
4187 free_dependence_relations (vec<ddr_p> dependence_relations)
4188 {
4189   unsigned int i;
4190   struct data_dependence_relation *ddr;
4191
4192   FOR_EACH_VEC_ELT (dependence_relations, i, ddr)
4193     if (ddr)
4194       free_dependence_relation (ddr);
4195
4196   dependence_relations.release ();
4197 }
4198
4199 /* Free the memory used by the data references from DATAREFS.  */
4200
4201 void
4202 free_data_refs (vec<data_reference_p> datarefs)
4203 {
4204   unsigned int i;
4205   struct data_reference *dr;
4206
4207   FOR_EACH_VEC_ELT (datarefs, i, dr)
4208     free_data_ref (dr);
4209   datarefs.release ();
4210 }