gcc/tree-data-ref.c

   1 /* Data references and dependences detectors.
   2    Copyright (C) 2003-2015 Free Software Foundation, Inc.
   3    Contributed by Sebastian Pop <pop@cri.ensmp.fr>
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 3, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 /* This pass walks a given loop structure searching for array
  22    references.  The information about the array accesses is recorded
  23    in DATA_REFERENCE structures.
  24
  25    The basic test for determining the dependences is:
  26    given two access functions chrec1 and chrec2 to a same array, and
  27    x and y two vectors from the iteration domain, the same element of
  28    the array is accessed twice at iterations x and y if and only if:
  29    |             chrec1 (x) == chrec2 (y).
  30
  31    The goals of this analysis are:
  32
  33    - to determine the independence: the relation between two
  34      independent accesses is qualified with the chrec_known (this
  35      information allows a loop parallelization),
  36
  37    - when two data references access the same data, to qualify the
  38      dependence relation with classic dependence representations:
  39
  40        - distance vectors
  41        - direction vectors
  42        - loop carried level dependence
  43        - polyhedron dependence
  44      or with the chains of recurrences based representation,
  45
  46    - to define a knowledge base for storing the data dependence
  47      information,
  48
  49    - to define an interface to access this data.
  50
  51
  52    Definitions:
  53
  54    - subscript: given two array accesses a subscript is the tuple
  55    composed of the access functions for a given dimension.  Example:
  56    Given A[f1][f2][f3] and B[g1][g2][g3], there are three subscripts:
  57    (f1, g1), (f2, g2), (f3, g3).
  58
  59    - Diophantine equation: an equation whose coefficients and
  60    solutions are integer constants, for example the equation
  61    |   3*x + 2*y = 1
  62    has an integer solution x = 1 and y = -1.
  63
  64    References:
  65
  66    - "Advanced Compilation for High Performance Computing" by Randy
  67    Allen and Ken Kennedy.
  68    http://citeseer.ist.psu.edu/goff91practical.html
  69
  70    - "Loop Transformations for Restructuring Compilers - The Foundations"
  71    by Utpal Banerjee.
  72
  73
  74 */
  75
  76 #include "config.h"
  77 #include "system.h"
  78 #include "coretypes.h"
  79 #include "input.h"
  80 #include "alias.h"
  81 #include "symtab.h"
  82 #include "options.h"
  83 #include "tree.h"
  84 #include "fold-const.h"
  85 #include "tm.h"
  86 #include "hard-reg-set.h"
  87 #include "function.h"
  88 #include "rtl.h"
  89 #include "flags.h"
  90 #include "insn-config.h"
  91 #include "expmed.h"
  92 #include "dojump.h"
  93 #include "explow.h"
  94 #include "calls.h"
  95 #include "emit-rtl.h"
  96 #include "varasm.h"
  97 #include "stmt.h"
  98 #include "expr.h"
  99 #include "gimple-pretty-print.h"
 100 #include "predict.h"
 101 #include "dominance.h"
 102 #include "cfg.h"
 103 #include "basic-block.h"
 104 #include "tree-ssa-alias.h"
 105 #include "internal-fn.h"
 106 #include "gimple-expr.h"
 107 #include "is-a.h"
 108 #include "gimple.h"
 109 #include "gimple-iterator.h"
 110 #include "tree-ssa-loop-niter.h"
 111 #include "tree-ssa-loop.h"
 112 #include "tree-ssa.h"
 113 #include "cfgloop.h"
 114 #include "tree-data-ref.h"
 115 #include "tree-scalar-evolution.h"
 116 #include "dumpfile.h"
 117 #include "langhooks.h"
 118 #include "tree-affine.h"
 119 #include "params.h"
 120
 121 static struct datadep_stats
 122 {
 123   int num_dependence_tests;
 124   int num_dependence_dependent;
 125   int num_dependence_independent;
 126   int num_dependence_undetermined;
 127
 128   int num_subscript_tests;
 129   int num_subscript_undetermined;
 130   int num_same_subscript_function;
 131
 132   int num_ziv;
 133   int num_ziv_independent;
 134   int num_ziv_dependent;
 135   int num_ziv_unimplemented;
 136
 137   int num_siv;
 138   int num_siv_independent;
 139   int num_siv_dependent;
 140   int num_siv_unimplemented;
 141
 142   int num_miv;
 143   int num_miv_independent;
 144   int num_miv_dependent;
 145   int num_miv_unimplemented;
 146 } dependence_stats;
 147
 148 static bool subscript_dependence_tester_1 (struct data_dependence_relation *,
 149                                            struct data_reference *,
 150                                            struct data_reference *,
 151                                            struct loop *);
 152 /* Returns true iff A divides B.  */
 153
 154 static inline bool
 155 tree_fold_divides_p (const_tree a, const_tree b)
 156 {
 157   gcc_assert (TREE_CODE (a) == INTEGER_CST);
 158   gcc_assert (TREE_CODE (b) == INTEGER_CST);
 159   return integer_zerop (int_const_binop (TRUNC_MOD_EXPR, b, a));
 160 }
 161
 162 /* Returns true iff A divides B.  */
 163
 164 static inline bool
 165 int_divides_p (int a, int b)
 166 {
 167   return ((b % a) == 0);
 168 }
 169
 170 \f
 171
 172 /* Dump into FILE all the data references from DATAREFS.  */
 173
 174 static void
 175 dump_data_references (FILE *file, vec<data_reference_p> datarefs)
 176 {
 177   unsigned int i;
 178   struct data_reference *dr;
 179
 180   FOR_EACH_VEC_ELT (datarefs, i, dr)
 181     dump_data_reference (file, dr);
 182 }
 183
 184 /* Unified dump into FILE all the data references from DATAREFS.  */
 185
 186 DEBUG_FUNCTION void
 187 debug (vec<data_reference_p> &ref)
 188 {
 189   dump_data_references (stderr, ref);
 190 }
 191
 192 DEBUG_FUNCTION void
 193 debug (vec<data_reference_p> *ptr)
 194 {
 195   if (ptr)
 196     debug (*ptr);
 197   else
 198     fprintf (stderr, "<nil>\n");
 199 }
 200
 201
 202 /* Dump into STDERR all the data references from DATAREFS.  */
 203
 204 DEBUG_FUNCTION void
 205 debug_data_references (vec<data_reference_p> datarefs)
 206 {
 207   dump_data_references (stderr, datarefs);
 208 }
 209
 210 /* Print to STDERR the data_reference DR.  */
 211
 212 DEBUG_FUNCTION void
 213 debug_data_reference (struct data_reference *dr)
 214 {
 215   dump_data_reference (stderr, dr);
 216 }
 217
 218 /* Dump function for a DATA_REFERENCE structure.  */
 219
 220 void
 221 dump_data_reference (FILE *outf,
 222                      struct data_reference *dr)
 223 {
 224   unsigned int i;
 225
 226   fprintf (outf, "#(Data Ref: \n");
 227   fprintf (outf, "#  bb: %d \n", gimple_bb (DR_STMT (dr))->index);
 228   fprintf (outf, "#  stmt: ");
 229   print_gimple_stmt (outf, DR_STMT (dr), 0, 0);
 230   fprintf (outf, "#  ref: ");
 231   print_generic_stmt (outf, DR_REF (dr), 0);
 232   fprintf (outf, "#  base_object: ");
 233   print_generic_stmt (outf, DR_BASE_OBJECT (dr), 0);
 234
 235   for (i = 0; i < DR_NUM_DIMENSIONS (dr); i++)
 236     {
 237       fprintf (outf, "#  Access function %d: ", i);
 238       print_generic_stmt (outf, DR_ACCESS_FN (dr, i), 0);
 239     }
 240   fprintf (outf, "#)\n");
 241 }
 242
 243 /* Unified dump function for a DATA_REFERENCE structure.  */
 244
 245 DEBUG_FUNCTION void
 246 debug (data_reference &ref)
 247 {
 248   dump_data_reference (stderr, &ref);
 249 }
 250
 251 DEBUG_FUNCTION void
 252 debug (data_reference *ptr)
 253 {
 254   if (ptr)
 255     debug (*ptr);
 256   else
 257     fprintf (stderr, "<nil>\n");
 258 }
 259
 260
 261 /* Dumps the affine function described by FN to the file OUTF.  */
 262
 263 static void
 264 dump_affine_function (FILE *outf, affine_fn fn)
 265 {
 266   unsigned i;
 267   tree coef;
 268
 269   print_generic_expr (outf, fn[0], TDF_SLIM);
 270   for (i = 1; fn.iterate (i, &coef); i++)
 271     {
 272       fprintf (outf, " + ");
 273       print_generic_expr (outf, coef, TDF_SLIM);
 274       fprintf (outf, " * x_%u", i);
 275     }
 276 }
 277
 278 /* Dumps the conflict function CF to the file OUTF.  */
 279
 280 static void
 281 dump_conflict_function (FILE *outf, conflict_function *cf)
 282 {
 283   unsigned i;
 284
 285   if (cf->n == NO_DEPENDENCE)
 286     fprintf (outf, "no dependence");
 287   else if (cf->n == NOT_KNOWN)
 288     fprintf (outf, "not known");
 289   else
 290     {
 291       for (i = 0; i < cf->n; i++)
 292         {
 293           if (i != 0)
 294             fprintf (outf, " ");
 295           fprintf (outf, "[");
 296           dump_affine_function (outf, cf->fns[i]);
 297           fprintf (outf, "]");
 298         }
 299     }
 300 }
 301
 302 /* Dump function for a SUBSCRIPT structure.  */
 303
 304 static void
 305 dump_subscript (FILE *outf, struct subscript *subscript)
 306 {
 307   conflict_function *cf = SUB_CONFLICTS_IN_A (subscript);
 308
 309   fprintf (outf, "\n (subscript \n");
 310   fprintf (outf, "  iterations_that_access_an_element_twice_in_A: ");
 311   dump_conflict_function (outf, cf);
 312   if (CF_NONTRIVIAL_P (cf))
 313     {
 314       tree last_iteration = SUB_LAST_CONFLICT (subscript);
 315       fprintf (outf, "\n  last_conflict: ");
 316       print_generic_expr (outf, last_iteration, 0);
 317     }
 318
 319   cf = SUB_CONFLICTS_IN_B (subscript);
 320   fprintf (outf, "\n  iterations_that_access_an_element_twice_in_B: ");
 321   dump_conflict_function (outf, cf);
 322   if (CF_NONTRIVIAL_P (cf))
 323     {
 324       tree last_iteration = SUB_LAST_CONFLICT (subscript);
 325       fprintf (outf, "\n  last_conflict: ");
 326       print_generic_expr (outf, last_iteration, 0);
 327     }
 328
 329   fprintf (outf, "\n  (Subscript distance: ");
 330   print_generic_expr (outf, SUB_DISTANCE (subscript), 0);
 331   fprintf (outf, " ))\n");
 332 }
 333
 334 /* Print the classic direction vector DIRV to OUTF.  */
 335
 336 static void
 337 print_direction_vector (FILE *outf,
 338                         lambda_vector dirv,
 339                         int length)
 340 {
 341   int eq;
 342
 343   for (eq = 0; eq < length; eq++)
 344     {
 345       enum data_dependence_direction dir = ((enum data_dependence_direction)
 346                                             dirv[eq]);
 347
 348       switch (dir)
 349         {
 350         case dir_positive:
 351           fprintf (outf, "    +");
 352           break;
 353         case dir_negative:
 354           fprintf (outf, "    -");
 355           break;
 356         case dir_equal:
 357           fprintf (outf, "    =");
 358           break;
 359         case dir_positive_or_equal:
 360           fprintf (outf, "   +=");
 361           break;
 362         case dir_positive_or_negative:
 363           fprintf (outf, "   +-");
 364           break;
 365         case dir_negative_or_equal:
 366           fprintf (outf, "   -=");
 367           break;
 368         case dir_star:
 369           fprintf (outf, "    *");
 370           break;
 371         default:
 372           fprintf (outf, "indep");
 373           break;
 374         }
 375     }
 376   fprintf (outf, "\n");
 377 }
 378
 379 /* Print a vector of direction vectors.  */
 380
 381 static void
 382 print_dir_vectors (FILE *outf, vec<lambda_vector> dir_vects,
 383                    int length)
 384 {
 385   unsigned j;
 386   lambda_vector v;
 387
 388   FOR_EACH_VEC_ELT (dir_vects, j, v)
 389     print_direction_vector (outf, v, length);
 390 }
 391
 392 /* Print out a vector VEC of length N to OUTFILE.  */
 393
 394 static inline void
 395 print_lambda_vector (FILE * outfile, lambda_vector vector, int n)
 396 {
 397   int i;
 398
 399   for (i = 0; i < n; i++)
 400     fprintf (outfile, "%3d ", vector[i]);
 401   fprintf (outfile, "\n");
 402 }
 403
 404 /* Print a vector of distance vectors.  */
 405
 406 static void
 407 print_dist_vectors (FILE *outf, vec<lambda_vector> dist_vects,
 408                     int length)
 409 {
 410   unsigned j;
 411   lambda_vector v;
 412
 413   FOR_EACH_VEC_ELT (dist_vects, j, v)
 414     print_lambda_vector (outf, v, length);
 415 }
 416
 417 /* Dump function for a DATA_DEPENDENCE_RELATION structure.  */
 418
 419 static void
 420 dump_data_dependence_relation (FILE *outf,
 421                                struct data_dependence_relation *ddr)
 422 {
 423   struct data_reference *dra, *drb;
 424
 425   fprintf (outf, "(Data Dep: \n");
 426
 427   if (!ddr || DDR_ARE_DEPENDENT (ddr) == chrec_dont_know)
 428     {
 429       if (ddr)
 430         {
 431           dra = DDR_A (ddr);
 432           drb = DDR_B (ddr);
 433           if (dra)
 434             dump_data_reference (outf, dra);
 435           else
 436             fprintf (outf, "    (nil)\n");
 437           if (drb)
 438             dump_data_reference (outf, drb);
 439           else
 440             fprintf (outf, "    (nil)\n");
 441         }
 442       fprintf (outf, "    (don't know)\n)\n");
 443       return;
 444     }
 445
 446   dra = DDR_A (ddr);
 447   drb = DDR_B (ddr);
 448   dump_data_reference (outf, dra);
 449   dump_data_reference (outf, drb);
 450
 451   if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
 452     fprintf (outf, "    (no dependence)\n");
 453
 454   else if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
 455     {
 456       unsigned int i;
 457       struct loop *loopi;
 458
 459       for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
 460         {
 461           fprintf (outf, "  access_fn_A: ");
 462           print_generic_stmt (outf, DR_ACCESS_FN (dra, i), 0);
 463           fprintf (outf, "  access_fn_B: ");
 464           print_generic_stmt (outf, DR_ACCESS_FN (drb, i), 0);
 465           dump_subscript (outf, DDR_SUBSCRIPT (ddr, i));
 466         }
 467
 468       fprintf (outf, "  inner loop index: %d\n", DDR_INNER_LOOP (ddr));
 469       fprintf (outf, "  loop nest: (");
 470       FOR_EACH_VEC_ELT (DDR_LOOP_NEST (ddr), i, loopi)
 471         fprintf (outf, "%d ", loopi->num);
 472       fprintf (outf, ")\n");
 473
 474       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
 475         {
 476           fprintf (outf, "  distance_vector: ");
 477           print_lambda_vector (outf, DDR_DIST_VECT (ddr, i),
 478                                DDR_NB_LOOPS (ddr));
 479         }
 480
 481       for (i = 0; i < DDR_NUM_DIR_VECTS (ddr); i++)
 482         {
 483           fprintf (outf, "  direction_vector: ");
 484           print_direction_vector (outf, DDR_DIR_VECT (ddr, i),
 485                                   DDR_NB_LOOPS (ddr));
 486         }
 487     }
 488
 489   fprintf (outf, ")\n");
 490 }
 491
 492 /* Debug version.  */
 493
 494 DEBUG_FUNCTION void
 495 debug_data_dependence_relation (struct data_dependence_relation *ddr)
 496 {
 497   dump_data_dependence_relation (stderr, ddr);
 498 }
 499
 500 /* Dump into FILE all the dependence relations from DDRS.  */
 501
 502 void
 503 dump_data_dependence_relations (FILE *file,
 504                                 vec<ddr_p> ddrs)
 505 {
 506   unsigned int i;
 507   struct data_dependence_relation *ddr;
 508
 509   FOR_EACH_VEC_ELT (ddrs, i, ddr)
 510     dump_data_dependence_relation (file, ddr);
 511 }
 512
 513 DEBUG_FUNCTION void
 514 debug (vec<ddr_p> &ref)
 515 {
 516   dump_data_dependence_relations (stderr, ref);
 517 }
 518
 519 DEBUG_FUNCTION void
 520 debug (vec<ddr_p> *ptr)
 521 {
 522   if (ptr)
 523     debug (*ptr);
 524   else
 525     fprintf (stderr, "<nil>\n");
 526 }
 527
 528
 529 /* Dump to STDERR all the dependence relations from DDRS.  */
 530
 531 DEBUG_FUNCTION void
 532 debug_data_dependence_relations (vec<ddr_p> ddrs)
 533 {
 534   dump_data_dependence_relations (stderr, ddrs);
 535 }
 536
 537 /* Dumps the distance and direction vectors in FILE.  DDRS contains
 538    the dependence relations, and VECT_SIZE is the size of the
 539    dependence vectors, or in other words the number of loops in the
 540    considered nest.  */
 541
 542 static void
 543 dump_dist_dir_vectors (FILE *file, vec<ddr_p> ddrs)
 544 {
 545   unsigned int i, j;
 546   struct data_dependence_relation *ddr;
 547   lambda_vector v;
 548
 549   FOR_EACH_VEC_ELT (ddrs, i, ddr)
 550     if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE && DDR_AFFINE_P (ddr))
 551       {
 552         FOR_EACH_VEC_ELT (DDR_DIST_VECTS (ddr), j, v)
 553           {
 554             fprintf (file, "DISTANCE_V (");
 555             print_lambda_vector (file, v, DDR_NB_LOOPS (ddr));
 556             fprintf (file, ")\n");
 557           }
 558
 559         FOR_EACH_VEC_ELT (DDR_DIR_VECTS (ddr), j, v)
 560           {
 561             fprintf (file, "DIRECTION_V (");
 562             print_direction_vector (file, v, DDR_NB_LOOPS (ddr));
 563             fprintf (file, ")\n");
 564           }
 565       }
 566
 567   fprintf (file, "\n\n");
 568 }
 569
 570 /* Dumps the data dependence relations DDRS in FILE.  */
 571
 572 static void
 573 dump_ddrs (FILE *file, vec<ddr_p> ddrs)
 574 {
 575   unsigned int i;
 576   struct data_dependence_relation *ddr;
 577
 578   FOR_EACH_VEC_ELT (ddrs, i, ddr)
 579     dump_data_dependence_relation (file, ddr);
 580
 581   fprintf (file, "\n\n");
 582 }
 583
 584 DEBUG_FUNCTION void
 585 debug_ddrs (vec<ddr_p> ddrs)
 586 {
 587   dump_ddrs (stderr, ddrs);
 588 }
 589
 590 /* Helper function for split_constant_offset.  Expresses OP0 CODE OP1
 591    (the type of the result is TYPE) as VAR + OFF, where OFF is a nonzero
 592    constant of type ssizetype, and returns true.  If we cannot do this
 593    with OFF nonzero, OFF and VAR are set to NULL_TREE instead and false
 594    is returned.  */
 595
 596 static bool
 597 split_constant_offset_1 (tree type, tree op0, enum tree_code code, tree op1,
 598                          tree *var, tree *off)
 599 {
 600   tree var0, var1;
 601   tree off0, off1;
 602   enum tree_code ocode = code;
 603
 604   *var = NULL_TREE;
 605   *off = NULL_TREE;
 606
 607   switch (code)
 608     {
 609     case INTEGER_CST:
 610       *var = build_int_cst (type, 0);
 611       *off = fold_convert (ssizetype, op0);
 612       return true;
 613
 614     case POINTER_PLUS_EXPR:
 615       ocode = PLUS_EXPR;
 616       /* FALLTHROUGH */
 617     case PLUS_EXPR:
 618     case MINUS_EXPR:
 619       split_constant_offset (op0, &var0, &off0);
 620       split_constant_offset (op1, &var1, &off1);
 621       *var = fold_build2 (code, type, var0, var1);
 622       *off = size_binop (ocode, off0, off1);
 623       return true;
 624
 625     case MULT_EXPR:
 626       if (TREE_CODE (op1) != INTEGER_CST)
 627         return false;
 628
 629       split_constant_offset (op0, &var0, &off0);
 630       *var = fold_build2 (MULT_EXPR, type, var0, op1);
 631       *off = size_binop (MULT_EXPR, off0, fold_convert (ssizetype, op1));
 632       return true;
 633
 634     case ADDR_EXPR:
 635       {
 636         tree base, poffset;
 637         HOST_WIDE_INT pbitsize, pbitpos;
 638         machine_mode pmode;
 639         int punsignedp, preversep, pvolatilep;
 640
 641         op0 = TREE_OPERAND (op0, 0);
 642         base
 643           = get_inner_reference (op0, &pbitsize, &pbitpos, &poffset, &pmode,
 644                                  &punsignedp, &preversep, &pvolatilep, false);
 645
 646         if (pbitpos % BITS_PER_UNIT != 0)
 647           return false;
 648         base = build_fold_addr_expr (base);
 649         off0 = ssize_int (pbitpos / BITS_PER_UNIT);
 650
 651         if (poffset)
 652           {
 653             split_constant_offset (poffset, &poffset, &off1);
 654             off0 = size_binop (PLUS_EXPR, off0, off1);
 655             if (POINTER_TYPE_P (TREE_TYPE (base)))
 656               base = fold_build_pointer_plus (base, poffset);
 657             else
 658               base = fold_build2 (PLUS_EXPR, TREE_TYPE (base), base,
 659                                   fold_convert (TREE_TYPE (base), poffset));
 660           }
 661
 662         var0 = fold_convert (type, base);
 663
 664         /* If variable length types are involved, punt, otherwise casts
 665            might be converted into ARRAY_REFs in gimplify_conversion.
 666            To compute that ARRAY_REF's element size TYPE_SIZE_UNIT, which
 667            possibly no longer appears in current GIMPLE, might resurface.
 668            This perhaps could run
 669            if (CONVERT_EXPR_P (var0))
 670              {
 671                gimplify_conversion (&var0);
 672                // Attempt to fill in any within var0 found ARRAY_REF's
 673                // element size from corresponding op embedded ARRAY_REF,
 674                // if unsuccessful, just punt.
 675              }  */
 676         while (POINTER_TYPE_P (type))
 677           type = TREE_TYPE (type);
 678         if (int_size_in_bytes (type) < 0)
 679           return false;
 680
 681         *var = var0;
 682         *off = off0;
 683         return true;
 684       }
 685
 686     case SSA_NAME:
 687       {
 688         if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (op0))
 689           return false;
 690
 691         gimple def_stmt = SSA_NAME_DEF_STMT (op0);
 692         enum tree_code subcode;
 693
 694         if (gimple_code (def_stmt) != GIMPLE_ASSIGN)
 695           return false;
 696
 697         var0 = gimple_assign_rhs1 (def_stmt);
 698         subcode = gimple_assign_rhs_code (def_stmt);
 699         var1 = gimple_assign_rhs2 (def_stmt);
 700
 701         return split_constant_offset_1 (type, var0, subcode, var1, var, off);
 702       }
 703     CASE_CONVERT:
 704       {
 705         /* We must not introduce undefined overflow, and we must not change the value.
 706            Hence we're okay if the inner type doesn't overflow to start with
 707            (pointer or signed), the outer type also is an integer or pointer
 708            and the outer precision is at least as large as the inner.  */
 709         tree itype = TREE_TYPE (op0);
 710         if ((POINTER_TYPE_P (itype)
 711              || (INTEGRAL_TYPE_P (itype) && TYPE_OVERFLOW_UNDEFINED (itype)))
 712             && TYPE_PRECISION (type) >= TYPE_PRECISION (itype)
 713             && (POINTER_TYPE_P (type) || INTEGRAL_TYPE_P (type)))
 714           {
 715             split_constant_offset (op0, &var0, off);
 716             *var = fold_convert (type, var0);
 717             return true;
 718           }
 719         return false;
 720       }
 721
 722     default:
 723       return false;
 724     }
 725 }
 726
 727 /* Expresses EXP as VAR + OFF, where off is a constant.  The type of OFF
 728    will be ssizetype.  */
 729
 730 void
 731 split_constant_offset (tree exp, tree *var, tree *off)
 732 {
 733   tree type = TREE_TYPE (exp), otype, op0, op1, e, o;
 734   enum tree_code code;
 735
 736   *var = exp;
 737   *off = ssize_int (0);
 738   STRIP_NOPS (exp);
 739
 740   if (tree_is_chrec (exp)
 741       || get_gimple_rhs_class (TREE_CODE (exp)) == GIMPLE_TERNARY_RHS)
 742     return;
 743
 744   otype = TREE_TYPE (exp);
 745   code = TREE_CODE (exp);
 746   extract_ops_from_tree (exp, &code, &op0, &op1);
 747   if (split_constant_offset_1 (otype, op0, code, op1, &e, &o))
 748     {
 749       *var = fold_convert (type, e);
 750       *off = o;
 751     }
 752 }
 753
 754 /* Returns the address ADDR of an object in a canonical shape (without nop
 755    casts, and with type of pointer to the object).  */
 756
 757 static tree
 758 canonicalize_base_object_address (tree addr)
 759 {
 760   tree orig = addr;
 761
 762   STRIP_NOPS (addr);
 763
 764   /* The base address may be obtained by casting from integer, in that case
 765      keep the cast.  */
 766   if (!POINTER_TYPE_P (TREE_TYPE (addr)))
 767     return orig;
 768
 769   if (TREE_CODE (addr) != ADDR_EXPR)
 770     return addr;
 771
 772   return build_fold_addr_expr (TREE_OPERAND (addr, 0));
 773 }
 774
 775 /* Analyzes the behavior of the memory reference DR in the innermost loop or
 776    basic block that contains it.  Returns true if analysis succeed or false
 777    otherwise.  */
 778
 779 bool
 780 dr_analyze_innermost (struct data_reference *dr, struct loop *nest)
 781 {
 782   gimple stmt = DR_STMT (dr);
 783   struct loop *loop = loop_containing_stmt (stmt);
 784   tree ref = DR_REF (dr);
 785   HOST_WIDE_INT pbitsize, pbitpos;
 786   tree base, poffset;
 787   machine_mode pmode;
 788   int punsignedp, preversep, pvolatilep;
 789   affine_iv base_iv, offset_iv;
 790   tree init, dinit, step;
 791   bool in_loop = (loop && loop->num);
 792
 793   if (dump_file && (dump_flags & TDF_DETAILS))
 794     fprintf (dump_file, "analyze_innermost: ");
 795
 796   base = get_inner_reference (ref, &pbitsize, &pbitpos, &poffset, &pmode,
 797                               &punsignedp, &preversep, &pvolatilep, false);
 798   gcc_assert (base != NULL_TREE);
 799
 800   if (pbitpos % BITS_PER_UNIT != 0)
 801     {
 802       if (dump_file && (dump_flags & TDF_DETAILS))
 803         fprintf (dump_file, "failed: bit offset alignment.\n");
 804       return false;
 805     }
 806
 807   if (preversep)
 808     {
 809       if (dump_file && (dump_flags & TDF_DETAILS))
 810         fprintf (dump_file, "failed: reverse storage order.\n");
 811       return false;
 812     }
 813
 814   if (TREE_CODE (base) == MEM_REF)
 815     {
 816       if (!integer_zerop (TREE_OPERAND (base, 1)))
 817         {
 818           offset_int moff = mem_ref_offset (base);
 819           tree mofft = wide_int_to_tree (sizetype, moff);
 820           if (!poffset)
 821             poffset = mofft;
 822           else
 823             poffset = size_binop (PLUS_EXPR, poffset, mofft);
 824         }
 825       base = TREE_OPERAND (base, 0);
 826     }
 827   else
 828     base = build_fold_addr_expr (base);
 829
 830   if (in_loop)
 831     {
 832       if (!simple_iv (loop, loop_containing_stmt (stmt), base, &base_iv,
 833                       nest ? true : false))
 834         {
 835           if (nest)
 836             {
 837               if (dump_file && (dump_flags & TDF_DETAILS))
 838                 fprintf (dump_file, "failed: evolution of base is not"
 839                                     " affine.\n");
 840               return false;
 841             }
 842           else
 843             {
 844               base_iv.base = base;
 845               base_iv.step = ssize_int (0);
 846               base_iv.no_overflow = true;
 847             }
 848         }
 849     }
 850   else
 851     {
 852       base_iv.base = base;
 853       base_iv.step = ssize_int (0);
 854       base_iv.no_overflow = true;
 855     }
 856
 857   if (!poffset)
 858     {
 859       offset_iv.base = ssize_int (0);
 860       offset_iv.step = ssize_int (0);
 861     }
 862   else
 863     {
 864       if (!in_loop)
 865         {
 866           offset_iv.base = poffset;
 867           offset_iv.step = ssize_int (0);
 868         }
 869       else if (!simple_iv (loop, loop_containing_stmt (stmt),
 870                            poffset, &offset_iv,
 871                            nest ? true : false))
 872         {
 873           if (nest)
 874             {
 875               if (dump_file && (dump_flags & TDF_DETAILS))
 876                 fprintf (dump_file, "failed: evolution of offset is not"
 877                                     " affine.\n");
 878               return false;
 879             }
 880           else
 881             {
 882               offset_iv.base = poffset;
 883               offset_iv.step = ssize_int (0);
 884             }
 885         }
 886     }
 887
 888   init = ssize_int (pbitpos / BITS_PER_UNIT);
 889   split_constant_offset (base_iv.base, &base_iv.base, &dinit);
 890   init =  size_binop (PLUS_EXPR, init, dinit);
 891   split_constant_offset (offset_iv.base, &offset_iv.base, &dinit);
 892   init =  size_binop (PLUS_EXPR, init, dinit);
 893
 894   step = size_binop (PLUS_EXPR,
 895                      fold_convert (ssizetype, base_iv.step),
 896                      fold_convert (ssizetype, offset_iv.step));
 897
 898   DR_BASE_ADDRESS (dr) = canonicalize_base_object_address (base_iv.base);
 899
 900   DR_OFFSET (dr) = fold_convert (ssizetype, offset_iv.base);
 901   DR_INIT (dr) = init;
 902   DR_STEP (dr) = step;
 903
 904   DR_ALIGNED_TO (dr) = size_int (highest_pow2_factor (offset_iv.base));
 905
 906   if (dump_file && (dump_flags & TDF_DETAILS))
 907     fprintf (dump_file, "success.\n");
 908
 909   return true;
 910 }
 911
 912 /* Determines the base object and the list of indices of memory reference
 913    DR, analyzed in LOOP and instantiated in loop nest NEST.  */
 914
 915 static void
 916 dr_analyze_indices (struct data_reference *dr, loop_p nest, loop_p loop)
 917 {
 918   vec<tree> access_fns = vNULL;
 919   tree ref, op;
 920   tree base, off, access_fn;
 921   basic_block before_loop;
 922
 923   /* If analyzing a basic-block there are no indices to analyze
 924      and thus no access functions.  */
 925   if (!nest)
 926     {
 927       DR_BASE_OBJECT (dr) = DR_REF (dr);
 928       DR_ACCESS_FNS (dr).create (0);
 929       return;
 930     }
 931
 932   ref = DR_REF (dr);
 933   before_loop = block_before_loop (nest);
 934
 935   /* REALPART_EXPR and IMAGPART_EXPR can be handled like accesses
 936      into a two element array with a constant index.  The base is
 937      then just the immediate underlying object.  */
 938   if (TREE_CODE (ref) == REALPART_EXPR)
 939     {
 940       ref = TREE_OPERAND (ref, 0);
 941       access_fns.safe_push (integer_zero_node);
 942     }
 943   else if (TREE_CODE (ref) == IMAGPART_EXPR)
 944     {
 945       ref = TREE_OPERAND (ref, 0);
 946       access_fns.safe_push (integer_one_node);
 947     }
 948
 949   /* Analyze access functions of dimensions we know to be independent.  */
 950   while (handled_component_p (ref))
 951     {
 952       if (TREE_CODE (ref) == ARRAY_REF)
 953         {
 954           op = TREE_OPERAND (ref, 1);
 955           access_fn = analyze_scalar_evolution (loop, op);
 956           access_fn = instantiate_scev (before_loop, loop, access_fn);
 957           access_fns.safe_push (access_fn);
 958         }
 959       else if (TREE_CODE (ref) == COMPONENT_REF
 960                && TREE_CODE (TREE_TYPE (TREE_OPERAND (ref, 0))) == RECORD_TYPE)
 961         {
 962           /* For COMPONENT_REFs of records (but not unions!) use the
 963              FIELD_DECL offset as constant access function so we can
 964              disambiguate a[i].f1 and a[i].f2.  */
 965           tree off = component_ref_field_offset (ref);
 966           off = size_binop (PLUS_EXPR,
 967                             size_binop (MULT_EXPR,
 968                                         fold_convert (bitsizetype, off),
 969                                         bitsize_int (BITS_PER_UNIT)),
 970                             DECL_FIELD_BIT_OFFSET (TREE_OPERAND (ref, 1)));
 971           access_fns.safe_push (off);
 972         }
 973       else
 974         /* If we have an unhandled component we could not translate
 975            to an access function stop analyzing.  We have determined
 976            our base object in this case.  */
 977         break;
 978
 979       ref = TREE_OPERAND (ref, 0);
 980     }
 981
 982   /* If the address operand of a MEM_REF base has an evolution in the
 983      analyzed nest, add it as an additional independent access-function.  */
 984   if (TREE_CODE (ref) == MEM_REF)
 985     {
 986       op = TREE_OPERAND (ref, 0);
 987       access_fn = analyze_scalar_evolution (loop, op);
 988       access_fn = instantiate_scev (before_loop, loop, access_fn);
 989       if (TREE_CODE (access_fn) == POLYNOMIAL_CHREC)
 990         {
 991           tree orig_type;
 992           tree memoff = TREE_OPERAND (ref, 1);
 993           base = initial_condition (access_fn);
 994           orig_type = TREE_TYPE (base);
 995           STRIP_USELESS_TYPE_CONVERSION (base);
 996           split_constant_offset (base, &base, &off);
 997           STRIP_USELESS_TYPE_CONVERSION (base);
 998           /* Fold the MEM_REF offset into the evolutions initial
 999              value to make more bases comparable.  */
1000           if (!integer_zerop (memoff))
1001             {
1002               off = size_binop (PLUS_EXPR, off,
1003                                 fold_convert (ssizetype, memoff));
1004               memoff = build_int_cst (TREE_TYPE (memoff), 0);
1005             }
1006           /* Adjust the offset so it is a multiple of the access type
1007              size and thus we separate bases that can possibly be used
1008              to produce partial overlaps (which the access_fn machinery
1009              cannot handle).  */
1010           wide_int rem;
1011           if (TYPE_SIZE_UNIT (TREE_TYPE (ref))
1012               && TREE_CODE (TYPE_SIZE_UNIT (TREE_TYPE (ref))) == INTEGER_CST
1013               && !integer_zerop (TYPE_SIZE_UNIT (TREE_TYPE (ref))))
1014             rem = wi::mod_trunc (off, TYPE_SIZE_UNIT (TREE_TYPE (ref)), SIGNED);
1015           else
1016             /* If we can't compute the remainder simply force the initial
1017                condition to zero.  */
1018             rem = off;
1019           off = wide_int_to_tree (ssizetype, wi::sub (off, rem));
1020           memoff = wide_int_to_tree (TREE_TYPE (memoff), rem);
1021           /* And finally replace the initial condition.  */
1022           access_fn = chrec_replace_initial_condition
1023               (access_fn, fold_convert (orig_type, off));
1024           /* ???  This is still not a suitable base object for
1025              dr_may_alias_p - the base object needs to be an
1026              access that covers the object as whole.  With
1027              an evolution in the pointer this cannot be
1028              guaranteed.
1029              As a band-aid, mark the access so we can special-case
1030              it in dr_may_alias_p.  */
1031           tree old = ref;
1032           ref = fold_build2_loc (EXPR_LOCATION (ref),
1033                                  MEM_REF, TREE_TYPE (ref),
1034                                  base, memoff);
1035           MR_DEPENDENCE_CLIQUE (ref) = MR_DEPENDENCE_CLIQUE (old);
1036           MR_DEPENDENCE_BASE (ref) = MR_DEPENDENCE_BASE (old);
1037           DR_UNCONSTRAINED_BASE (dr) = true;
1038           access_fns.safe_push (access_fn);
1039         }
1040     }
1041   else if (DECL_P (ref))
1042     {
1043       /* Canonicalize DR_BASE_OBJECT to MEM_REF form.  */
1044       ref = build2 (MEM_REF, TREE_TYPE (ref),
1045                     build_fold_addr_expr (ref),
1046                     build_int_cst (reference_alias_ptr_type (ref), 0));
1047     }
1048
1049   DR_BASE_OBJECT (dr) = ref;
1050   DR_ACCESS_FNS (dr) = access_fns;
1051 }
1052
1053 /* Extracts the alias analysis information from the memory reference DR.  */
1054
1055 static void
1056 dr_analyze_alias (struct data_reference *dr)
1057 {
1058   tree ref = DR_REF (dr);
1059   tree base = get_base_address (ref), addr;
1060
1061   if (INDIRECT_REF_P (base)
1062       || TREE_CODE (base) == MEM_REF)
1063     {
1064       addr = TREE_OPERAND (base, 0);
1065       if (TREE_CODE (addr) == SSA_NAME)
1066         DR_PTR_INFO (dr) = SSA_NAME_PTR_INFO (addr);
1067     }
1068 }
1069
1070 /* Frees data reference DR.  */
1071
1072 void
1073 free_data_ref (data_reference_p dr)
1074 {
1075   DR_ACCESS_FNS (dr).release ();
1076   free (dr);
1077 }
1078
1079 /* Analyzes memory reference MEMREF accessed in STMT.  The reference
1080    is read if IS_READ is true, write otherwise.  Returns the
1081    data_reference description of MEMREF.  NEST is the outermost loop
1082    in which the reference should be instantiated, LOOP is the loop in
1083    which the data reference should be analyzed.  */
1084
1085 struct data_reference *
1086 create_data_ref (loop_p nest, loop_p loop, tree memref, gimple stmt,
1087                  bool is_read)
1088 {
1089   struct data_reference *dr;
1090
1091   if (dump_file && (dump_flags & TDF_DETAILS))
1092     {
1093       fprintf (dump_file, "Creating dr for ");
1094       print_generic_expr (dump_file, memref, TDF_SLIM);
1095       fprintf (dump_file, "\n");
1096     }
1097
1098   dr = XCNEW (struct data_reference);
1099   DR_STMT (dr) = stmt;
1100   DR_REF (dr) = memref;
1101   DR_IS_READ (dr) = is_read;
1102
1103   dr_analyze_innermost (dr, nest);
1104   dr_analyze_indices (dr, nest, loop);
1105   dr_analyze_alias (dr);
1106
1107   if (dump_file && (dump_flags & TDF_DETAILS))
1108     {
1109       unsigned i;
1110       fprintf (dump_file, "\tbase_address: ");
1111       print_generic_expr (dump_file, DR_BASE_ADDRESS (dr), TDF_SLIM);
1112       fprintf (dump_file, "\n\toffset from base address: ");
1113       print_generic_expr (dump_file, DR_OFFSET (dr), TDF_SLIM);
1114       fprintf (dump_file, "\n\tconstant offset from base address: ");
1115       print_generic_expr (dump_file, DR_INIT (dr), TDF_SLIM);
1116       fprintf (dump_file, "\n\tstep: ");
1117       print_generic_expr (dump_file, DR_STEP (dr), TDF_SLIM);
1118       fprintf (dump_file, "\n\taligned to: ");
1119       print_generic_expr (dump_file, DR_ALIGNED_TO (dr), TDF_SLIM);
1120       fprintf (dump_file, "\n\tbase_object: ");
1121       print_generic_expr (dump_file, DR_BASE_OBJECT (dr), TDF_SLIM);
1122       fprintf (dump_file, "\n");
1123       for (i = 0; i < DR_NUM_DIMENSIONS (dr); i++)
1124         {
1125           fprintf (dump_file, "\tAccess function %d: ", i);
1126           print_generic_stmt (dump_file, DR_ACCESS_FN (dr, i), TDF_SLIM);
1127         }
1128     }
1129
1130   return dr;
1131 }
1132
1133 /* Check if OFFSET1 and OFFSET2 (DR_OFFSETs of some data-refs) are identical
1134    expressions.  */
1135 static bool
1136 dr_equal_offsets_p1 (tree offset1, tree offset2)
1137 {
1138   bool res;
1139
1140   STRIP_NOPS (offset1);
1141   STRIP_NOPS (offset2);
1142
1143   if (offset1 == offset2)
1144     return true;
1145
1146   if (TREE_CODE (offset1) != TREE_CODE (offset2)
1147       || (!BINARY_CLASS_P (offset1) && !UNARY_CLASS_P (offset1)))
1148     return false;
1149
1150   res = dr_equal_offsets_p1 (TREE_OPERAND (offset1, 0),
1151                              TREE_OPERAND (offset2, 0));
1152
1153   if (!res || !BINARY_CLASS_P (offset1))
1154     return res;
1155
1156   res = dr_equal_offsets_p1 (TREE_OPERAND (offset1, 1),
1157                              TREE_OPERAND (offset2, 1));
1158
1159   return res;
1160 }
1161
1162 /* Check if DRA and DRB have equal offsets.  */
1163 bool
1164 dr_equal_offsets_p (struct data_reference *dra,
1165                     struct data_reference *drb)
1166 {
1167   tree offset1, offset2;
1168
1169   offset1 = DR_OFFSET (dra);
1170   offset2 = DR_OFFSET (drb);
1171
1172   return dr_equal_offsets_p1 (offset1, offset2);
1173 }
1174
1175 /* Returns true if FNA == FNB.  */
1176
1177 static bool
1178 affine_function_equal_p (affine_fn fna, affine_fn fnb)
1179 {
1180   unsigned i, n = fna.length ();
1181
1182   if (n != fnb.length ())
1183     return false;
1184
1185   for (i = 0; i < n; i++)
1186     if (!operand_equal_p (fna[i], fnb[i], 0))
1187       return false;
1188
1189   return true;
1190 }
1191
1192 /* If all the functions in CF are the same, returns one of them,
1193    otherwise returns NULL.  */
1194
1195 static affine_fn
1196 common_affine_function (conflict_function *cf)
1197 {
1198   unsigned i;
1199   affine_fn comm;
1200
1201   if (!CF_NONTRIVIAL_P (cf))
1202     return affine_fn ();
1203
1204   comm = cf->fns[0];
1205
1206   for (i = 1; i < cf->n; i++)
1207     if (!affine_function_equal_p (comm, cf->fns[i]))
1208       return affine_fn ();
1209
1210   return comm;
1211 }
1212
1213 /* Returns the base of the affine function FN.  */
1214
1215 static tree
1216 affine_function_base (affine_fn fn)
1217 {
1218   return fn[0];
1219 }
1220
1221 /* Returns true if FN is a constant.  */
1222
1223 static bool
1224 affine_function_constant_p (affine_fn fn)
1225 {
1226   unsigned i;
1227   tree coef;
1228
1229   for (i = 1; fn.iterate (i, &coef); i++)
1230     if (!integer_zerop (coef))
1231       return false;
1232
1233   return true;
1234 }
1235
1236 /* Returns true if FN is the zero constant function.  */
1237
1238 static bool
1239 affine_function_zero_p (affine_fn fn)
1240 {
1241   return (integer_zerop (affine_function_base (fn))
1242           && affine_function_constant_p (fn));
1243 }
1244
1245 /* Returns a signed integer type with the largest precision from TA
1246    and TB.  */
1247
1248 static tree
1249 signed_type_for_types (tree ta, tree tb)
1250 {
1251   if (TYPE_PRECISION (ta) > TYPE_PRECISION (tb))
1252     return signed_type_for (ta);
1253   else
1254     return signed_type_for (tb);
1255 }
1256
1257 /* Applies operation OP on affine functions FNA and FNB, and returns the
1258    result.  */
1259
1260 static affine_fn
1261 affine_fn_op (enum tree_code op, affine_fn fna, affine_fn fnb)
1262 {
1263   unsigned i, n, m;
1264   affine_fn ret;
1265   tree coef;
1266
1267   if (fnb.length () > fna.length ())
1268     {
1269       n = fna.length ();
1270       m = fnb.length ();
1271     }
1272   else
1273     {
1274       n = fnb.length ();
1275       m = fna.length ();
1276     }
1277
1278   ret.create (m);
1279   for (i = 0; i < n; i++)
1280     {
1281       tree type = signed_type_for_types (TREE_TYPE (fna[i]),
1282                                          TREE_TYPE (fnb[i]));
1283       ret.quick_push (fold_build2 (op, type, fna[i], fnb[i]));
1284     }
1285
1286   for (; fna.iterate (i, &coef); i++)
1287     ret.quick_push (fold_build2 (op, signed_type_for (TREE_TYPE (coef)),
1288                                  coef, integer_zero_node));
1289   for (; fnb.iterate (i, &coef); i++)
1290     ret.quick_push (fold_build2 (op, signed_type_for (TREE_TYPE (coef)),
1291                                  integer_zero_node, coef));
1292
1293   return ret;
1294 }
1295
1296 /* Returns the sum of affine functions FNA and FNB.  */
1297
1298 static affine_fn
1299 affine_fn_plus (affine_fn fna, affine_fn fnb)
1300 {
1301   return affine_fn_op (PLUS_EXPR, fna, fnb);
1302 }
1303
1304 /* Returns the difference of affine functions FNA and FNB.  */
1305
1306 static affine_fn
1307 affine_fn_minus (affine_fn fna, affine_fn fnb)
1308 {
1309   return affine_fn_op (MINUS_EXPR, fna, fnb);
1310 }
1311
1312 /* Frees affine function FN.  */
1313
1314 static void
1315 affine_fn_free (affine_fn fn)
1316 {
1317   fn.release ();
1318 }
1319
1320 /* Determine for each subscript in the data dependence relation DDR
1321    the distance.  */
1322
1323 static void
1324 compute_subscript_distance (struct data_dependence_relation *ddr)
1325 {
1326   conflict_function *cf_a, *cf_b;
1327   affine_fn fn_a, fn_b, diff;
1328
1329   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
1330     {
1331       unsigned int i;
1332
1333       for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
1334         {
1335           struct subscript *subscript;
1336
1337           subscript = DDR_SUBSCRIPT (ddr, i);
1338           cf_a = SUB_CONFLICTS_IN_A (subscript);
1339           cf_b = SUB_CONFLICTS_IN_B (subscript);
1340
1341           fn_a = common_affine_function (cf_a);
1342           fn_b = common_affine_function (cf_b);
1343           if (!fn_a.exists () || !fn_b.exists ())
1344             {
1345               SUB_DISTANCE (subscript) = chrec_dont_know;
1346               return;
1347             }
1348           diff = affine_fn_minus (fn_a, fn_b);
1349
1350           if (affine_function_constant_p (diff))
1351             SUB_DISTANCE (subscript) = affine_function_base (diff);
1352           else
1353             SUB_DISTANCE (subscript) = chrec_dont_know;
1354
1355           affine_fn_free (diff);
1356         }
1357     }
1358 }
1359
1360 /* Returns the conflict function for "unknown".  */
1361
1362 static conflict_function *
1363 conflict_fn_not_known (void)
1364 {
1365   conflict_function *fn = XCNEW (conflict_function);
1366   fn->n = NOT_KNOWN;
1367
1368   return fn;
1369 }
1370
1371 /* Returns the conflict function for "independent".  */
1372
1373 static conflict_function *
1374 conflict_fn_no_dependence (void)
1375 {
1376   conflict_function *fn = XCNEW (conflict_function);
1377   fn->n = NO_DEPENDENCE;
1378
1379   return fn;
1380 }
1381
1382 /* Returns true if the address of OBJ is invariant in LOOP.  */
1383
1384 static bool
1385 object_address_invariant_in_loop_p (const struct loop *loop, const_tree obj)
1386 {
1387   while (handled_component_p (obj))
1388     {
1389       if (TREE_CODE (obj) == ARRAY_REF)
1390         {
1391           /* Index of the ARRAY_REF was zeroed in analyze_indices, thus we only
1392              need to check the stride and the lower bound of the reference.  */
1393           if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 2),
1394                                                       loop->num)
1395               || chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 3),
1396                                                          loop->num))
1397             return false;
1398         }
1399       else if (TREE_CODE (obj) == COMPONENT_REF)
1400         {
1401           if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 2),
1402                                                       loop->num))
1403             return false;
1404         }
1405       obj = TREE_OPERAND (obj, 0);
1406     }
1407
1408   if (!INDIRECT_REF_P (obj)
1409       && TREE_CODE (obj) != MEM_REF)
1410     return true;
1411
1412   return !chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 0),
1413                                                   loop->num);
1414 }
1415
1416 /* Returns false if we can prove that data references A and B do not alias,
1417    true otherwise.  If LOOP_NEST is false no cross-iteration aliases are
1418    considered.  */
1419
1420 bool
1421 dr_may_alias_p (const struct data_reference *a, const struct data_reference *b,
1422                 bool loop_nest)
1423 {
1424   tree addr_a = DR_BASE_OBJECT (a);
1425   tree addr_b = DR_BASE_OBJECT (b);
1426
1427   /* If we are not processing a loop nest but scalar code we
1428      do not need to care about possible cross-iteration dependences
1429      and thus can process the full original reference.  Do so,
1430      similar to how loop invariant motion applies extra offset-based
1431      disambiguation.  */
1432   if (!loop_nest)
1433     {
1434       aff_tree off1, off2;
1435       widest_int size1, size2;
1436       get_inner_reference_aff (DR_REF (a), &off1, &size1);
1437       get_inner_reference_aff (DR_REF (b), &off2, &size2);
1438       aff_combination_scale (&off1, -1);
1439       aff_combination_add (&off2, &off1);
1440       if (aff_comb_cannot_overlap_p (&off2, size1, size2))
1441         return false;
1442     }
1443
1444   if ((TREE_CODE (addr_a) == MEM_REF || TREE_CODE (addr_a) == TARGET_MEM_REF)
1445       && (TREE_CODE (addr_b) == MEM_REF || TREE_CODE (addr_b) == TARGET_MEM_REF)
1446       && MR_DEPENDENCE_CLIQUE (addr_a) == MR_DEPENDENCE_CLIQUE (addr_b)
1447       && MR_DEPENDENCE_BASE (addr_a) != MR_DEPENDENCE_BASE (addr_b))
1448     return false;
1449
1450   /* If we had an evolution in a pointer-based MEM_REF BASE_OBJECT we
1451      do not know the size of the base-object.  So we cannot do any
1452      offset/overlap based analysis but have to rely on points-to
1453      information only.  */
1454   if (TREE_CODE (addr_a) == MEM_REF
1455       && (DR_UNCONSTRAINED_BASE (a)
1456           || TREE_CODE (TREE_OPERAND (addr_a, 0)) == SSA_NAME))
1457     {
1458       /* For true dependences we can apply TBAA.  */
1459       if (flag_strict_aliasing
1460           && DR_IS_WRITE (a) && DR_IS_READ (b)
1461           && !alias_sets_conflict_p (get_alias_set (DR_REF (a)),
1462                                      get_alias_set (DR_REF (b))))
1463         return false;
1464       if (TREE_CODE (addr_b) == MEM_REF)
1465         return ptr_derefs_may_alias_p (TREE_OPERAND (addr_a, 0),
1466                                        TREE_OPERAND (addr_b, 0));
1467       else
1468         return ptr_derefs_may_alias_p (TREE_OPERAND (addr_a, 0),
1469                                        build_fold_addr_expr (addr_b));
1470     }
1471   else if (TREE_CODE (addr_b) == MEM_REF
1472            && (DR_UNCONSTRAINED_BASE (b)
1473                || TREE_CODE (TREE_OPERAND (addr_b, 0)) == SSA_NAME))
1474     {
1475       /* For true dependences we can apply TBAA.  */
1476       if (flag_strict_aliasing
1477           && DR_IS_WRITE (a) && DR_IS_READ (b)
1478           && !alias_sets_conflict_p (get_alias_set (DR_REF (a)),
1479                                      get_alias_set (DR_REF (b))))
1480         return false;
1481       if (TREE_CODE (addr_a) == MEM_REF)
1482         return ptr_derefs_may_alias_p (TREE_OPERAND (addr_a, 0),
1483                                        TREE_OPERAND (addr_b, 0));
1484       else
1485         return ptr_derefs_may_alias_p (build_fold_addr_expr (addr_a),
1486                                        TREE_OPERAND (addr_b, 0));
1487     }
1488
1489   /* Otherwise DR_BASE_OBJECT is an access that covers the whole object
1490      that is being subsetted in the loop nest.  */
1491   if (DR_IS_WRITE (a) && DR_IS_WRITE (b))
1492     return refs_output_dependent_p (addr_a, addr_b);
1493   else if (DR_IS_READ (a) && DR_IS_WRITE (b))
1494     return refs_anti_dependent_p (addr_a, addr_b);
1495   return refs_may_alias_p (addr_a, addr_b);
1496 }
1497
1498 /* Initialize a data dependence relation between data accesses A and
1499    B.  NB_LOOPS is the number of loops surrounding the references: the
1500    size of the classic distance/direction vectors.  */
1501
1502 struct data_dependence_relation *
1503 initialize_data_dependence_relation (struct data_reference *a,
1504                                      struct data_reference *b,
1505                                      vec<loop_p> loop_nest)
1506 {
1507   struct data_dependence_relation *res;
1508   unsigned int i;
1509
1510   res = XNEW (struct data_dependence_relation);
1511   DDR_A (res) = a;
1512   DDR_B (res) = b;
1513   DDR_LOOP_NEST (res).create (0);
1514   DDR_REVERSED_P (res) = false;
1515   DDR_SUBSCRIPTS (res).create (0);
1516   DDR_DIR_VECTS (res).create (0);
1517   DDR_DIST_VECTS (res).create (0);
1518
1519   if (a == NULL || b == NULL)
1520     {
1521       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1522       return res;
1523     }
1524
1525   /* If the data references do not alias, then they are independent.  */
1526   if (!dr_may_alias_p (a, b, loop_nest.exists ()))
1527     {
1528       DDR_ARE_DEPENDENT (res) = chrec_known;
1529       return res;
1530     }
1531
1532   /* The case where the references are exactly the same.  */
1533   if (operand_equal_p (DR_REF (a), DR_REF (b), 0))
1534     {
1535      if (loop_nest.exists ()
1536         && !object_address_invariant_in_loop_p (loop_nest[0],
1537                                                 DR_BASE_OBJECT (a)))
1538       {
1539         DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1540         return res;
1541       }
1542       DDR_AFFINE_P (res) = true;
1543       DDR_ARE_DEPENDENT (res) = NULL_TREE;
1544       DDR_SUBSCRIPTS (res).create (DR_NUM_DIMENSIONS (a));
1545       DDR_LOOP_NEST (res) = loop_nest;
1546       DDR_INNER_LOOP (res) = 0;
1547       DDR_SELF_REFERENCE (res) = true;
1548       for (i = 0; i < DR_NUM_DIMENSIONS (a); i++)
1549        {
1550          struct subscript *subscript;
1551
1552          subscript = XNEW (struct subscript);
1553          SUB_CONFLICTS_IN_A (subscript) = conflict_fn_not_known ();
1554          SUB_CONFLICTS_IN_B (subscript) = conflict_fn_not_known ();
1555          SUB_LAST_CONFLICT (subscript) = chrec_dont_know;
1556          SUB_DISTANCE (subscript) = chrec_dont_know;
1557          DDR_SUBSCRIPTS (res).safe_push (subscript);
1558        }
1559       return res;
1560     }
1561
1562   /* If the references do not access the same object, we do not know
1563      whether they alias or not.  */
1564   if (!operand_equal_p (DR_BASE_OBJECT (a), DR_BASE_OBJECT (b), 0))
1565     {
1566       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1567       return res;
1568     }
1569
1570   /* If the base of the object is not invariant in the loop nest, we cannot
1571      analyze it.  TODO -- in fact, it would suffice to record that there may
1572      be arbitrary dependences in the loops where the base object varies.  */
1573   if (loop_nest.exists ()
1574       && !object_address_invariant_in_loop_p (loop_nest[0],
1575                                               DR_BASE_OBJECT (a)))
1576     {
1577       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1578       return res;
1579     }
1580
1581   /* If the number of dimensions of the access to not agree we can have
1582      a pointer access to a component of the array element type and an
1583      array access while the base-objects are still the same.  Punt.  */
1584   if (DR_NUM_DIMENSIONS (a) != DR_NUM_DIMENSIONS (b))
1585     {
1586       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1587       return res;
1588     }
1589
1590   DDR_AFFINE_P (res) = true;
1591   DDR_ARE_DEPENDENT (res) = NULL_TREE;
1592   DDR_SUBSCRIPTS (res).create (DR_NUM_DIMENSIONS (a));
1593   DDR_LOOP_NEST (res) = loop_nest;
1594   DDR_INNER_LOOP (res) = 0;
1595   DDR_SELF_REFERENCE (res) = false;
1596
1597   for (i = 0; i < DR_NUM_DIMENSIONS (a); i++)
1598     {
1599       struct subscript *subscript;
1600
1601       subscript = XNEW (struct subscript);
1602       SUB_CONFLICTS_IN_A (subscript) = conflict_fn_not_known ();
1603       SUB_CONFLICTS_IN_B (subscript) = conflict_fn_not_known ();
1604       SUB_LAST_CONFLICT (subscript) = chrec_dont_know;
1605       SUB_DISTANCE (subscript) = chrec_dont_know;
1606       DDR_SUBSCRIPTS (res).safe_push (subscript);
1607     }
1608
1609   return res;
1610 }
1611
1612 /* Frees memory used by the conflict function F.  */
1613
1614 static void
1615 free_conflict_function (conflict_function *f)
1616 {
1617   unsigned i;
1618
1619   if (CF_NONTRIVIAL_P (f))
1620     {
1621       for (i = 0; i < f->n; i++)
1622         affine_fn_free (f->fns[i]);
1623     }
1624   free (f);
1625 }
1626
1627 /* Frees memory used by SUBSCRIPTS.  */
1628
1629 static void
1630 free_subscripts (vec<subscript_p> subscripts)
1631 {
1632   unsigned i;
1633   subscript_p s;
1634
1635   FOR_EACH_VEC_ELT (subscripts, i, s)
1636     {
1637       free_conflict_function (s->conflicting_iterations_in_a);
1638       free_conflict_function (s->conflicting_iterations_in_b);
1639       free (s);
1640     }
1641   subscripts.release ();
1642 }
1643
1644 /* Set DDR_ARE_DEPENDENT to CHREC and finalize the subscript overlap
1645    description.  */
1646
1647 static inline void
1648 finalize_ddr_dependent (struct data_dependence_relation *ddr,
1649                         tree chrec)
1650 {
1651   DDR_ARE_DEPENDENT (ddr) = chrec;
1652   free_subscripts (DDR_SUBSCRIPTS (ddr));
1653   DDR_SUBSCRIPTS (ddr).create (0);
1654 }
1655
1656 /* The dependence relation DDR cannot be represented by a distance
1657    vector.  */
1658
1659 static inline void
1660 non_affine_dependence_relation (struct data_dependence_relation *ddr)
1661 {
1662   if (dump_file && (dump_flags & TDF_DETAILS))
1663     fprintf (dump_file, "(Dependence relation cannot be represented by distance vector.) \n");
1664
1665   DDR_AFFINE_P (ddr) = false;
1666 }
1667
1668 \f
1669
1670 /* This section contains the classic Banerjee tests.  */
1671
1672 /* Returns true iff CHREC_A and CHREC_B are not dependent on any index
1673    variables, i.e., if the ZIV (Zero Index Variable) test is true.  */
1674
1675 static inline bool
1676 ziv_subscript_p (const_tree chrec_a, const_tree chrec_b)
1677 {
1678   return (evolution_function_is_constant_p (chrec_a)
1679           && evolution_function_is_constant_p (chrec_b));
1680 }
1681
1682 /* Returns true iff CHREC_A and CHREC_B are dependent on an index
1683    variable, i.e., if the SIV (Single Index Variable) test is true.  */
1684
1685 static bool
1686 siv_subscript_p (const_tree chrec_a, const_tree chrec_b)
1687 {
1688   if ((evolution_function_is_constant_p (chrec_a)
1689        && evolution_function_is_univariate_p (chrec_b))
1690       || (evolution_function_is_constant_p (chrec_b)
1691           && evolution_function_is_univariate_p (chrec_a)))
1692     return true;
1693
1694   if (evolution_function_is_univariate_p (chrec_a)
1695       && evolution_function_is_univariate_p (chrec_b))
1696     {
1697       switch (TREE_CODE (chrec_a))
1698         {
1699         case POLYNOMIAL_CHREC:
1700           switch (TREE_CODE (chrec_b))
1701             {
1702             case POLYNOMIAL_CHREC:
1703               if (CHREC_VARIABLE (chrec_a) != CHREC_VARIABLE (chrec_b))
1704                 return false;
1705
1706             default:
1707               return true;
1708             }
1709
1710         default:
1711           return true;
1712         }
1713     }
1714
1715   return false;
1716 }
1717
1718 /* Creates a conflict function with N dimensions.  The affine functions
1719    in each dimension follow.  */
1720
1721 static conflict_function *
1722 conflict_fn (unsigned n, ...)
1723 {
1724   unsigned i;
1725   conflict_function *ret = XCNEW (conflict_function);
1726   va_list ap;
1727
1728   gcc_assert (0 < n && n <= MAX_DIM);
1729   va_start (ap, n);
1730
1731   ret->n = n;
1732   for (i = 0; i < n; i++)
1733     ret->fns[i] = va_arg (ap, affine_fn);
1734   va_end (ap);
1735
1736   return ret;
1737 }
1738
1739 /* Returns constant affine function with value CST.  */
1740
1741 static affine_fn
1742 affine_fn_cst (tree cst)
1743 {
1744   affine_fn fn;
1745   fn.create (1);
1746   fn.quick_push (cst);
1747   return fn;
1748 }
1749
1750 /* Returns affine function with single variable, CST + COEF * x_DIM.  */
1751
1752 static affine_fn
1753 affine_fn_univar (tree cst, unsigned dim, tree coef)
1754 {
1755   affine_fn fn;
1756   fn.create (dim + 1);
1757   unsigned i;
1758
1759   gcc_assert (dim > 0);
1760   fn.quick_push (cst);
1761   for (i = 1; i < dim; i++)
1762     fn.quick_push (integer_zero_node);
1763   fn.quick_push (coef);
1764   return fn;
1765 }
1766
1767 /* Analyze a ZIV (Zero Index Variable) subscript.  *OVERLAPS_A and
1768    *OVERLAPS_B are initialized to the functions that describe the
1769    relation between the elements accessed twice by CHREC_A and
1770    CHREC_B.  For k >= 0, the following property is verified:
1771
1772    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
1773
1774 static void
1775 analyze_ziv_subscript (tree chrec_a,
1776                        tree chrec_b,
1777                        conflict_function **overlaps_a,
1778                        conflict_function **overlaps_b,
1779                        tree *last_conflicts)
1780 {
1781   tree type, difference;
1782   dependence_stats.num_ziv++;
1783
1784   if (dump_file && (dump_flags & TDF_DETAILS))
1785     fprintf (dump_file, "(analyze_ziv_subscript \n");
1786
1787   type = signed_type_for_types (TREE_TYPE (chrec_a), TREE_TYPE (chrec_b));
1788   chrec_a = chrec_convert (type, chrec_a, NULL);
1789   chrec_b = chrec_convert (type, chrec_b, NULL);
1790   difference = chrec_fold_minus (type, chrec_a, chrec_b);
1791
1792   switch (TREE_CODE (difference))
1793     {
1794     case INTEGER_CST:
1795       if (integer_zerop (difference))
1796         {
1797           /* The difference is equal to zero: the accessed index
1798              overlaps for each iteration in the loop.  */
1799           *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1800           *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1801           *last_conflicts = chrec_dont_know;
1802           dependence_stats.num_ziv_dependent++;
1803         }
1804       else
1805         {
1806           /* The accesses do not overlap.  */
1807           *overlaps_a = conflict_fn_no_dependence ();
1808           *overlaps_b = conflict_fn_no_dependence ();
1809           *last_conflicts = integer_zero_node;
1810           dependence_stats.num_ziv_independent++;
1811         }
1812       break;
1813
1814     default:
1815       /* We're not sure whether the indexes overlap.  For the moment,
1816          conservatively answer "don't know".  */
1817       if (dump_file && (dump_flags & TDF_DETAILS))
1818         fprintf (dump_file, "ziv test failed: difference is non-integer.\n");
1819
1820       *overlaps_a = conflict_fn_not_known ();
1821       *overlaps_b = conflict_fn_not_known ();
1822       *last_conflicts = chrec_dont_know;
1823       dependence_stats.num_ziv_unimplemented++;
1824       break;
1825     }
1826
1827   if (dump_file && (dump_flags & TDF_DETAILS))
1828     fprintf (dump_file, ")\n");
1829 }
1830
1831 /* Similar to max_stmt_executions_int, but returns the bound as a tree,
1832    and only if it fits to the int type.  If this is not the case, or the
1833    bound  on the number of iterations of LOOP could not be derived, returns
1834    chrec_dont_know.  */
1835
1836 static tree
1837 max_stmt_executions_tree (struct loop *loop)
1838 {
1839   widest_int nit;
1840
1841   if (!max_stmt_executions (loop, &nit))
1842     return chrec_dont_know;
1843
1844   if (!wi::fits_to_tree_p (nit, unsigned_type_node))
1845     return chrec_dont_know;
1846
1847   return wide_int_to_tree (unsigned_type_node, nit);
1848 }
1849
1850 /* Determine whether the CHREC is always positive/negative.  If the expression
1851    cannot be statically analyzed, return false, otherwise set the answer into
1852    VALUE.  */
1853
1854 static bool
1855 chrec_is_positive (tree chrec, bool *value)
1856 {
1857   bool value0, value1, value2;
1858   tree end_value, nb_iter;
1859
1860   switch (TREE_CODE (chrec))
1861     {
1862     case POLYNOMIAL_CHREC:
1863       if (!chrec_is_positive (CHREC_LEFT (chrec), &value0)
1864           || !chrec_is_positive (CHREC_RIGHT (chrec), &value1))
1865         return false;
1866
1867       /* FIXME -- overflows.  */
1868       if (value0 == value1)
1869         {
1870           *value = value0;
1871           return true;
1872         }
1873
1874       /* Otherwise the chrec is under the form: "{-197, +, 2}_1",
1875          and the proof consists in showing that the sign never
1876          changes during the execution of the loop, from 0 to
1877          loop->nb_iterations.  */
1878       if (!evolution_function_is_affine_p (chrec))
1879         return false;
1880
1881       nb_iter = number_of_latch_executions (get_chrec_loop (chrec));
1882       if (chrec_contains_undetermined (nb_iter))
1883         return false;
1884
1885 #if 0
1886       /* TODO -- If the test is after the exit, we may decrease the number of
1887          iterations by one.  */
1888       if (after_exit)
1889         nb_iter = chrec_fold_minus (type, nb_iter, build_int_cst (type, 1));
1890 #endif
1891
1892       end_value = chrec_apply (CHREC_VARIABLE (chrec), chrec, nb_iter);
1893
1894       if (!chrec_is_positive (end_value, &value2))
1895         return false;
1896
1897       *value = value0;
1898       return value0 == value1;
1899
1900     case INTEGER_CST:
1901       switch (tree_int_cst_sgn (chrec))
1902         {
1903         case -1:
1904           *value = false;
1905           break;
1906         case 1:
1907           *value = true;
1908           break;
1909         default:
1910           return false;
1911         }
1912       return true;
1913
1914     default:
1915       return false;
1916     }
1917 }
1918
1919
1920 /* Analyze a SIV (Single Index Variable) subscript where CHREC_A is a
1921    constant, and CHREC_B is an affine function.  *OVERLAPS_A and
1922    *OVERLAPS_B are initialized to the functions that describe the
1923    relation between the elements accessed twice by CHREC_A and
1924    CHREC_B.  For k >= 0, the following property is verified:
1925
1926    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
1927
1928 static void
1929 analyze_siv_subscript_cst_affine (tree chrec_a,
1930                                   tree chrec_b,
1931                                   conflict_function **overlaps_a,
1932                                   conflict_function **overlaps_b,
1933                                   tree *last_conflicts)
1934 {
1935   bool value0, value1, value2;
1936   tree type, difference, tmp;
1937
1938   type = signed_type_for_types (TREE_TYPE (chrec_a), TREE_TYPE (chrec_b));
1939   chrec_a = chrec_convert (type, chrec_a, NULL);
1940   chrec_b = chrec_convert (type, chrec_b, NULL);
1941   difference = chrec_fold_minus (type, initial_condition (chrec_b), chrec_a);
1942
1943   /* Special case overlap in the first iteration.  */
1944   if (integer_zerop (difference))
1945     {
1946       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1947       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1948       *last_conflicts = integer_one_node;
1949       return;
1950     }
1951
1952   if (!chrec_is_positive (initial_condition (difference), &value0))
1953     {
1954       if (dump_file && (dump_flags & TDF_DETAILS))
1955         fprintf (dump_file, "siv test failed: chrec is not positive.\n");
1956
1957       dependence_stats.num_siv_unimplemented++;
1958       *overlaps_a = conflict_fn_not_known ();
1959       *overlaps_b = conflict_fn_not_known ();
1960       *last_conflicts = chrec_dont_know;
1961       return;
1962     }
1963   else
1964     {
1965       if (value0 == false)
1966         {
1967           if (!chrec_is_positive (CHREC_RIGHT (chrec_b), &value1))
1968             {
1969               if (dump_file && (dump_flags & TDF_DETAILS))
1970                 fprintf (dump_file, "siv test failed: chrec not positive.\n");
1971
1972               *overlaps_a = conflict_fn_not_known ();
1973               *overlaps_b = conflict_fn_not_known ();
1974               *last_conflicts = chrec_dont_know;
1975               dependence_stats.num_siv_unimplemented++;
1976               return;
1977             }
1978           else
1979             {
1980               if (value1 == true)
1981                 {
1982                   /* Example:
1983                      chrec_a = 12
1984                      chrec_b = {10, +, 1}
1985                   */
1986
1987                   if (tree_fold_divides_p (CHREC_RIGHT (chrec_b), difference))
1988                     {
1989                       HOST_WIDE_INT numiter;
1990                       struct loop *loop = get_chrec_loop (chrec_b);
1991
1992                       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1993                       tmp = fold_build2 (EXACT_DIV_EXPR, type,
1994                                          fold_build1 (ABS_EXPR, type, difference),
1995                                          CHREC_RIGHT (chrec_b));
1996                       *overlaps_b = conflict_fn (1, affine_fn_cst (tmp));
1997                       *last_conflicts = integer_one_node;
1998
1999
2000                       /* Perform weak-zero siv test to see if overlap is
2001                          outside the loop bounds.  */
2002                       numiter = max_stmt_executions_int (loop);
2003
2004                       if (numiter >= 0
2005                           && compare_tree_int (tmp, numiter) > 0)
2006                         {
2007                           free_conflict_function (*overlaps_a);
2008                           free_conflict_function (*overlaps_b);
2009                           *overlaps_a = conflict_fn_no_dependence ();
2010                           *overlaps_b = conflict_fn_no_dependence ();
2011                           *last_conflicts = integer_zero_node;
2012                           dependence_stats.num_siv_independent++;
2013                           return;
2014                         }
2015                       dependence_stats.num_siv_dependent++;
2016                       return;
2017                     }
2018
2019                   /* When the step does not divide the difference, there are
2020                      no overlaps.  */
2021                   else
2022                     {
2023                       *overlaps_a = conflict_fn_no_dependence ();
2024                       *overlaps_b = conflict_fn_no_dependence ();
2025                       *last_conflicts = integer_zero_node;
2026                       dependence_stats.num_siv_independent++;
2027                       return;
2028                     }
2029                 }
2030
2031               else
2032                 {
2033                   /* Example:
2034                      chrec_a = 12
2035                      chrec_b = {10, +, -1}
2036
2037                      In this case, chrec_a will not overlap with chrec_b.  */
2038                   *overlaps_a = conflict_fn_no_dependence ();
2039                   *overlaps_b = conflict_fn_no_dependence ();
2040                   *last_conflicts = integer_zero_node;
2041                   dependence_stats.num_siv_independent++;
2042                   return;
2043                 }
2044             }
2045         }
2046       else
2047         {
2048           if (!chrec_is_positive (CHREC_RIGHT (chrec_b), &value2))
2049             {
2050               if (dump_file && (dump_flags & TDF_DETAILS))
2051                 fprintf (dump_file, "siv test failed: chrec not positive.\n");
2052
2053               *overlaps_a = conflict_fn_not_known ();
2054               *overlaps_b = conflict_fn_not_known ();
2055               *last_conflicts = chrec_dont_know;
2056               dependence_stats.num_siv_unimplemented++;
2057               return;
2058             }
2059           else
2060             {
2061               if (value2 == false)
2062                 {
2063                   /* Example:
2064                      chrec_a = 3
2065                      chrec_b = {10, +, -1}
2066                   */
2067                   if (tree_fold_divides_p (CHREC_RIGHT (chrec_b), difference))
2068                     {
2069                       HOST_WIDE_INT numiter;
2070                       struct loop *loop = get_chrec_loop (chrec_b);
2071
2072                       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2073                       tmp = fold_build2 (EXACT_DIV_EXPR, type, difference,
2074                                          CHREC_RIGHT (chrec_b));
2075                       *overlaps_b = conflict_fn (1, affine_fn_cst (tmp));
2076                       *last_conflicts = integer_one_node;
2077
2078                       /* Perform weak-zero siv test to see if overlap is
2079                          outside the loop bounds.  */
2080                       numiter = max_stmt_executions_int (loop);
2081
2082                       if (numiter >= 0
2083                           && compare_tree_int (tmp, numiter) > 0)
2084                         {
2085                           free_conflict_function (*overlaps_a);
2086                           free_conflict_function (*overlaps_b);
2087                           *overlaps_a = conflict_fn_no_dependence ();
2088                           *overlaps_b = conflict_fn_no_dependence ();
2089                           *last_conflicts = integer_zero_node;
2090                           dependence_stats.num_siv_independent++;
2091                           return;
2092                         }
2093                       dependence_stats.num_siv_dependent++;
2094                       return;
2095                     }
2096
2097                   /* When the step does not divide the difference, there
2098                      are no overlaps.  */
2099                   else
2100                     {
2101                       *overlaps_a = conflict_fn_no_dependence ();
2102                       *overlaps_b = conflict_fn_no_dependence ();
2103                       *last_conflicts = integer_zero_node;
2104                       dependence_stats.num_siv_independent++;
2105                       return;
2106                     }
2107                 }
2108               else
2109                 {
2110                   /* Example:
2111                      chrec_a = 3
2112                      chrec_b = {4, +, 1}
2113
2114                      In this case, chrec_a will not overlap with chrec_b.  */
2115                   *overlaps_a = conflict_fn_no_dependence ();
2116                   *overlaps_b = conflict_fn_no_dependence ();
2117                   *last_conflicts = integer_zero_node;
2118                   dependence_stats.num_siv_independent++;
2119                   return;
2120                 }
2121             }
2122         }
2123     }
2124 }
2125
2126 /* Helper recursive function for initializing the matrix A.  Returns
2127    the initial value of CHREC.  */
2128
2129 static tree
2130 initialize_matrix_A (lambda_matrix A, tree chrec, unsigned index, int mult)
2131 {
2132   gcc_assert (chrec);
2133
2134   switch (TREE_CODE (chrec))
2135     {
2136     case POLYNOMIAL_CHREC:
2137       gcc_assert (TREE_CODE (CHREC_RIGHT (chrec)) == INTEGER_CST);
2138
2139       A[index][0] = mult * int_cst_value (CHREC_RIGHT (chrec));
2140       return initialize_matrix_A (A, CHREC_LEFT (chrec), index + 1, mult);
2141
2142     case PLUS_EXPR:
2143     case MULT_EXPR:
2144     case MINUS_EXPR:
2145       {
2146         tree op0 = initialize_matrix_A (A, TREE_OPERAND (chrec, 0), index, mult);
2147         tree op1 = initialize_matrix_A (A, TREE_OPERAND (chrec, 1), index, mult);
2148
2149         return chrec_fold_op (TREE_CODE (chrec), chrec_type (chrec), op0, op1);
2150       }
2151
2152     CASE_CONVERT:
2153       {
2154         tree op = initialize_matrix_A (A, TREE_OPERAND (chrec, 0), index, mult);
2155         return chrec_convert (chrec_type (chrec), op, NULL);
2156       }
2157
2158     case BIT_NOT_EXPR:
2159       {
2160         /* Handle ~X as -1 - X.  */
2161         tree op = initialize_matrix_A (A, TREE_OPERAND (chrec, 0), index, mult);
2162         return chrec_fold_op (MINUS_EXPR, chrec_type (chrec),
2163                               build_int_cst (TREE_TYPE (chrec), -1), op);
2164       }
2165
2166     case INTEGER_CST:
2167       return chrec;
2168
2169     default:
2170       gcc_unreachable ();
2171       return NULL_TREE;
2172     }
2173 }
2174
2175 #define FLOOR_DIV(x,y) ((x) / (y))
2176
2177 /* Solves the special case of the Diophantine equation:
2178    | {0, +, STEP_A}_x (OVERLAPS_A) = {0, +, STEP_B}_y (OVERLAPS_B)
2179
2180    Computes the descriptions OVERLAPS_A and OVERLAPS_B.  NITER is the
2181    number of iterations that loops X and Y run.  The overlaps will be
2182    constructed as evolutions in dimension DIM.  */
2183
2184 static void
2185 compute_overlap_steps_for_affine_univar (int niter, int step_a, int step_b,
2186                                          affine_fn *overlaps_a,
2187                                          affine_fn *overlaps_b,
2188                                          tree *last_conflicts, int dim)
2189 {
2190   if (((step_a > 0 && step_b > 0)
2191        || (step_a < 0 && step_b < 0)))
2192     {
2193       int step_overlaps_a, step_overlaps_b;
2194       int gcd_steps_a_b, last_conflict, tau2;
2195
2196       gcd_steps_a_b = gcd (step_a, step_b);
2197       step_overlaps_a = step_b / gcd_steps_a_b;
2198       step_overlaps_b = step_a / gcd_steps_a_b;
2199
2200       if (niter > 0)
2201         {
2202           tau2 = FLOOR_DIV (niter, step_overlaps_a);
2203           tau2 = MIN (tau2, FLOOR_DIV (niter, step_overlaps_b));
2204           last_conflict = tau2;
2205           *last_conflicts = build_int_cst (NULL_TREE, last_conflict);
2206         }
2207       else
2208         *last_conflicts = chrec_dont_know;
2209
2210       *overlaps_a = affine_fn_univar (integer_zero_node, dim,
2211                                       build_int_cst (NULL_TREE,
2212                                                      step_overlaps_a));
2213       *overlaps_b = affine_fn_univar (integer_zero_node, dim,
2214                                       build_int_cst (NULL_TREE,
2215                                                      step_overlaps_b));
2216     }
2217
2218   else
2219     {
2220       *overlaps_a = affine_fn_cst (integer_zero_node);
2221       *overlaps_b = affine_fn_cst (integer_zero_node);
2222       *last_conflicts = integer_zero_node;
2223     }
2224 }
2225
2226 /* Solves the special case of a Diophantine equation where CHREC_A is
2227    an affine bivariate function, and CHREC_B is an affine univariate
2228    function.  For example,
2229
2230    | {{0, +, 1}_x, +, 1335}_y = {0, +, 1336}_z
2231
2232    has the following overlapping functions:
2233
2234    | x (t, u, v) = {{0, +, 1336}_t, +, 1}_v
2235    | y (t, u, v) = {{0, +, 1336}_u, +, 1}_v
2236    | z (t, u, v) = {{{0, +, 1}_t, +, 1335}_u, +, 1}_v
2237
2238    FORNOW: This is a specialized implementation for a case occurring in
2239    a common benchmark.  Implement the general algorithm.  */
2240
2241 static void
2242 compute_overlap_steps_for_affine_1_2 (tree chrec_a, tree chrec_b,
2243                                       conflict_function **overlaps_a,
2244                                       conflict_function **overlaps_b,
2245                                       tree *last_conflicts)
2246 {
2247   bool xz_p, yz_p, xyz_p;
2248   int step_x, step_y, step_z;
2249   HOST_WIDE_INT niter_x, niter_y, niter_z, niter;
2250   affine_fn overlaps_a_xz, overlaps_b_xz;
2251   affine_fn overlaps_a_yz, overlaps_b_yz;
2252   affine_fn overlaps_a_xyz, overlaps_b_xyz;
2253   affine_fn ova1, ova2, ovb;
2254   tree last_conflicts_xz, last_conflicts_yz, last_conflicts_xyz;
2255
2256   step_x = int_cst_value (CHREC_RIGHT (CHREC_LEFT (chrec_a)));
2257   step_y = int_cst_value (CHREC_RIGHT (chrec_a));
2258   step_z = int_cst_value (CHREC_RIGHT (chrec_b));
2259
2260   niter_x = max_stmt_executions_int (get_chrec_loop (CHREC_LEFT (chrec_a)));
2261   niter_y = max_stmt_executions_int (get_chrec_loop (chrec_a));
2262   niter_z = max_stmt_executions_int (get_chrec_loop (chrec_b));
2263
2264   if (niter_x < 0 || niter_y < 0 || niter_z < 0)
2265     {
2266       if (dump_file && (dump_flags & TDF_DETAILS))
2267         fprintf (dump_file, "overlap steps test failed: no iteration counts.\n");
2268
2269       *overlaps_a = conflict_fn_not_known ();
2270       *overlaps_b = conflict_fn_not_known ();
2271       *last_conflicts = chrec_dont_know;
2272       return;
2273     }
2274
2275   niter = MIN (niter_x, niter_z);
2276   compute_overlap_steps_for_affine_univar (niter, step_x, step_z,
2277                                            &overlaps_a_xz,
2278                                            &overlaps_b_xz,
2279                                            &last_conflicts_xz, 1);
2280   niter = MIN (niter_y, niter_z);
2281   compute_overlap_steps_for_affine_univar (niter, step_y, step_z,
2282                                            &overlaps_a_yz,
2283                                            &overlaps_b_yz,
2284                                            &last_conflicts_yz, 2);
2285   niter = MIN (niter_x, niter_z);
2286   niter = MIN (niter_y, niter);
2287   compute_overlap_steps_for_affine_univar (niter, step_x + step_y, step_z,
2288                                            &overlaps_a_xyz,
2289                                            &overlaps_b_xyz,
2290                                            &last_conflicts_xyz, 3);
2291
2292   xz_p = !integer_zerop (last_conflicts_xz);
2293   yz_p = !integer_zerop (last_conflicts_yz);
2294   xyz_p = !integer_zerop (last_conflicts_xyz);
2295
2296   if (xz_p || yz_p || xyz_p)
2297     {
2298       ova1 = affine_fn_cst (integer_zero_node);
2299       ova2 = affine_fn_cst (integer_zero_node);
2300       ovb = affine_fn_cst (integer_zero_node);
2301       if (xz_p)
2302         {
2303           affine_fn t0 = ova1;
2304           affine_fn t2 = ovb;
2305
2306           ova1 = affine_fn_plus (ova1, overlaps_a_xz);
2307           ovb = affine_fn_plus (ovb, overlaps_b_xz);
2308           affine_fn_free (t0);
2309           affine_fn_free (t2);
2310           *last_conflicts = last_conflicts_xz;
2311         }
2312       if (yz_p)
2313         {
2314           affine_fn t0 = ova2;
2315           affine_fn t2 = ovb;
2316
2317           ova2 = affine_fn_plus (ova2, overlaps_a_yz);
2318           ovb = affine_fn_plus (ovb, overlaps_b_yz);
2319           affine_fn_free (t0);
2320           affine_fn_free (t2);
2321           *last_conflicts = last_conflicts_yz;
2322         }
2323       if (xyz_p)
2324         {
2325           affine_fn t0 = ova1;
2326           affine_fn t2 = ova2;
2327           affine_fn t4 = ovb;
2328
2329           ova1 = affine_fn_plus (ova1, overlaps_a_xyz);
2330           ova2 = affine_fn_plus (ova2, overlaps_a_xyz);
2331           ovb = affine_fn_plus (ovb, overlaps_b_xyz);
2332           affine_fn_free (t0);
2333           affine_fn_free (t2);
2334           affine_fn_free (t4);
2335           *last_conflicts = last_conflicts_xyz;
2336         }
2337       *overlaps_a = conflict_fn (2, ova1, ova2);
2338       *overlaps_b = conflict_fn (1, ovb);
2339     }
2340   else
2341     {
2342       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2343       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2344       *last_conflicts = integer_zero_node;
2345     }
2346
2347   affine_fn_free (overlaps_a_xz);
2348   affine_fn_free (overlaps_b_xz);
2349   affine_fn_free (overlaps_a_yz);
2350   affine_fn_free (overlaps_b_yz);
2351   affine_fn_free (overlaps_a_xyz);
2352   affine_fn_free (overlaps_b_xyz);
2353 }
2354
2355 /* Copy the elements of vector VEC1 with length SIZE to VEC2.  */
2356
2357 static void
2358 lambda_vector_copy (lambda_vector vec1, lambda_vector vec2,
2359                     int size)
2360 {
2361   memcpy (vec2, vec1, size * sizeof (*vec1));
2362 }
2363
2364 /* Copy the elements of M x N matrix MAT1 to MAT2.  */
2365
2366 static void
2367 lambda_matrix_copy (lambda_matrix mat1, lambda_matrix mat2,
2368                     int m, int n)
2369 {
2370   int i;
2371
2372   for (i = 0; i < m; i++)
2373     lambda_vector_copy (mat1[i], mat2[i], n);
2374 }
2375
2376 /* Store the N x N identity matrix in MAT.  */
2377
2378 static void
2379 lambda_matrix_id (lambda_matrix mat, int size)
2380 {
2381   int i, j;
2382
2383   for (i = 0; i < size; i++)
2384     for (j = 0; j < size; j++)
2385       mat[i][j] = (i == j) ? 1 : 0;
2386 }
2387
2388 /* Return the first nonzero element of vector VEC1 between START and N.
2389    We must have START <= N.   Returns N if VEC1 is the zero vector.  */
2390
2391 static int
2392 lambda_vector_first_nz (lambda_vector vec1, int n, int start)
2393 {
2394   int j = start;
2395   while (j < n && vec1[j] == 0)
2396     j++;
2397   return j;
2398 }
2399
2400 /* Add a multiple of row R1 of matrix MAT with N columns to row R2:
2401    R2 = R2 + CONST1 * R1.  */
2402
2403 static void
2404 lambda_matrix_row_add (lambda_matrix mat, int n, int r1, int r2, int const1)
2405 {
2406   int i;
2407
2408   if (const1 == 0)
2409     return;
2410
2411   for (i = 0; i < n; i++)
2412     mat[r2][i] += const1 * mat[r1][i];
2413 }
2414
2415 /* Multiply vector VEC1 of length SIZE by a constant CONST1,
2416    and store the result in VEC2.  */
2417
2418 static void
2419 lambda_vector_mult_const (lambda_vector vec1, lambda_vector vec2,
2420                           int size, int const1)
2421 {
2422   int i;
2423
2424   if (const1 == 0)
2425     lambda_vector_clear (vec2, size);
2426   else
2427     for (i = 0; i < size; i++)
2428       vec2[i] = const1 * vec1[i];
2429 }
2430
2431 /* Negate vector VEC1 with length SIZE and store it in VEC2.  */
2432
2433 static void
2434 lambda_vector_negate (lambda_vector vec1, lambda_vector vec2,
2435                       int size)
2436 {
2437   lambda_vector_mult_const (vec1, vec2, size, -1);
2438 }
2439
2440 /* Negate row R1 of matrix MAT which has N columns.  */
2441
2442 static void
2443 lambda_matrix_row_negate (lambda_matrix mat, int n, int r1)
2444 {
2445   lambda_vector_negate (mat[r1], mat[r1], n);
2446 }
2447
2448 /* Return true if two vectors are equal.  */
2449
2450 static bool
2451 lambda_vector_equal (lambda_vector vec1, lambda_vector vec2, int size)
2452 {
2453   int i;
2454   for (i = 0; i < size; i++)
2455     if (vec1[i] != vec2[i])
2456       return false;
2457   return true;
2458 }
2459
2460 /* Given an M x N integer matrix A, this function determines an M x
2461    M unimodular matrix U, and an M x N echelon matrix S such that
2462    "U.A = S".  This decomposition is also known as "right Hermite".
2463
2464    Ref: Algorithm 2.1 page 33 in "Loop Transformations for
2465    Restructuring Compilers" Utpal Banerjee.  */
2466
2467 static void
2468 lambda_matrix_right_hermite (lambda_matrix A, int m, int n,
2469                              lambda_matrix S, lambda_matrix U)
2470 {
2471   int i, j, i0 = 0;
2472
2473   lambda_matrix_copy (A, S, m, n);
2474   lambda_matrix_id (U, m);
2475
2476   for (j = 0; j < n; j++)
2477     {
2478       if (lambda_vector_first_nz (S[j], m, i0) < m)
2479         {
2480           ++i0;
2481           for (i = m - 1; i >= i0; i--)
2482             {
2483               while (S[i][j] != 0)
2484                 {
2485                   int sigma, factor, a, b;
2486
2487                   a = S[i-1][j];
2488                   b = S[i][j];
2489                   sigma = (a * b < 0) ? -1: 1;
2490                   a = abs (a);
2491                   b = abs (b);
2492                   factor = sigma * (a / b);
2493
2494                   lambda_matrix_row_add (S, n, i, i-1, -factor);
2495                   std::swap (S[i], S[i-1]);
2496
2497                   lambda_matrix_row_add (U, m, i, i-1, -factor);
2498                   std::swap (U[i], U[i-1]);
2499                 }
2500             }
2501         }
2502     }
2503 }
2504
2505 /* Determines the overlapping elements due to accesses CHREC_A and
2506    CHREC_B, that are affine functions.  This function cannot handle
2507    symbolic evolution functions, ie. when initial conditions are
2508    parameters, because it uses lambda matrices of integers.  */
2509
2510 static void
2511 analyze_subscript_affine_affine (tree chrec_a,
2512                                  tree chrec_b,
2513                                  conflict_function **overlaps_a,
2514                                  conflict_function **overlaps_b,
2515                                  tree *last_conflicts)
2516 {
2517   unsigned nb_vars_a, nb_vars_b, dim;
2518   HOST_WIDE_INT init_a, init_b, gamma, gcd_alpha_beta;
2519   lambda_matrix A, U, S;
2520   struct obstack scratch_obstack;
2521
2522   if (eq_evolutions_p (chrec_a, chrec_b))
2523     {
2524       /* The accessed index overlaps for each iteration in the
2525          loop.  */
2526       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2527       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2528       *last_conflicts = chrec_dont_know;
2529       return;
2530     }
2531   if (dump_file && (dump_flags & TDF_DETAILS))
2532     fprintf (dump_file, "(analyze_subscript_affine_affine \n");
2533
2534   /* For determining the initial intersection, we have to solve a
2535      Diophantine equation.  This is the most time consuming part.
2536
2537      For answering to the question: "Is there a dependence?" we have
2538      to prove that there exists a solution to the Diophantine
2539      equation, and that the solution is in the iteration domain,
2540      i.e. the solution is positive or zero, and that the solution
2541      happens before the upper bound loop.nb_iterations.  Otherwise
2542      there is no dependence.  This function outputs a description of
2543      the iterations that hold the intersections.  */
2544
2545   nb_vars_a = nb_vars_in_chrec (chrec_a);
2546   nb_vars_b = nb_vars_in_chrec (chrec_b);
2547
2548   gcc_obstack_init (&scratch_obstack);
2549
2550   dim = nb_vars_a + nb_vars_b;
2551   U = lambda_matrix_new (dim, dim, &scratch_obstack);
2552   A = lambda_matrix_new (dim, 1, &scratch_obstack);
2553   S = lambda_matrix_new (dim, 1, &scratch_obstack);
2554
2555   init_a = int_cst_value (initialize_matrix_A (A, chrec_a, 0, 1));
2556   init_b = int_cst_value (initialize_matrix_A (A, chrec_b, nb_vars_a, -1));
2557   gamma = init_b - init_a;
2558
2559   /* Don't do all the hard work of solving the Diophantine equation
2560      when we already know the solution: for example,
2561      | {3, +, 1}_1
2562      | {3, +, 4}_2
2563      | gamma = 3 - 3 = 0.
2564      Then the first overlap occurs during the first iterations:
2565      | {3, +, 1}_1 ({0, +, 4}_x) = {3, +, 4}_2 ({0, +, 1}_x)
2566   */
2567   if (gamma == 0)
2568     {
2569       if (nb_vars_a == 1 && nb_vars_b == 1)
2570         {
2571           HOST_WIDE_INT step_a, step_b;
2572           HOST_WIDE_INT niter, niter_a, niter_b;
2573           affine_fn ova, ovb;
2574
2575           niter_a = max_stmt_executions_int (get_chrec_loop (chrec_a));
2576           niter_b = max_stmt_executions_int (get_chrec_loop (chrec_b));
2577           niter = MIN (niter_a, niter_b);
2578           step_a = int_cst_value (CHREC_RIGHT (chrec_a));
2579           step_b = int_cst_value (CHREC_RIGHT (chrec_b));
2580
2581           compute_overlap_steps_for_affine_univar (niter, step_a, step_b,
2582                                                    &ova, &ovb,
2583                                                    last_conflicts, 1);
2584           *overlaps_a = conflict_fn (1, ova);
2585           *overlaps_b = conflict_fn (1, ovb);
2586         }
2587
2588       else if (nb_vars_a == 2 && nb_vars_b == 1)
2589         compute_overlap_steps_for_affine_1_2
2590           (chrec_a, chrec_b, overlaps_a, overlaps_b, last_conflicts);
2591
2592       else if (nb_vars_a == 1 && nb_vars_b == 2)
2593         compute_overlap_steps_for_affine_1_2
2594           (chrec_b, chrec_a, overlaps_b, overlaps_a, last_conflicts);
2595
2596       else
2597         {
2598           if (dump_file && (dump_flags & TDF_DETAILS))
2599             fprintf (dump_file, "affine-affine test failed: too many variables.\n");
2600           *overlaps_a = conflict_fn_not_known ();
2601           *overlaps_b = conflict_fn_not_known ();
2602           *last_conflicts = chrec_dont_know;
2603         }
2604       goto end_analyze_subs_aa;
2605     }
2606
2607   /* U.A = S */
2608   lambda_matrix_right_hermite (A, dim, 1, S, U);
2609
2610   if (S[0][0] < 0)
2611     {
2612       S[0][0] *= -1;
2613       lambda_matrix_row_negate (U, dim, 0);
2614     }
2615   gcd_alpha_beta = S[0][0];
2616
2617   /* Something went wrong: for example in {1, +, 0}_5 vs. {0, +, 0}_5,
2618      but that is a quite strange case.  Instead of ICEing, answer
2619      don't know.  */
2620   if (gcd_alpha_beta == 0)
2621     {
2622       *overlaps_a = conflict_fn_not_known ();
2623       *overlaps_b = conflict_fn_not_known ();
2624       *last_conflicts = chrec_dont_know;
2625       goto end_analyze_subs_aa;
2626     }
2627
2628   /* The classic "gcd-test".  */
2629   if (!int_divides_p (gcd_alpha_beta, gamma))
2630     {
2631       /* The "gcd-test" has determined that there is no integer
2632          solution, i.e. there is no dependence.  */
2633       *overlaps_a = conflict_fn_no_dependence ();
2634       *overlaps_b = conflict_fn_no_dependence ();
2635       *last_conflicts = integer_zero_node;
2636     }
2637
2638   /* Both access functions are univariate.  This includes SIV and MIV cases.  */
2639   else if (nb_vars_a == 1 && nb_vars_b == 1)
2640     {
2641       /* Both functions should have the same evolution sign.  */
2642       if (((A[0][0] > 0 && -A[1][0] > 0)
2643            || (A[0][0] < 0 && -A[1][0] < 0)))
2644         {
2645           /* The solutions are given by:
2646              |
2647              | [GAMMA/GCD_ALPHA_BETA  t].[u11 u12]  = [x0]
2648              |                           [u21 u22]    [y0]
2649
2650              For a given integer t.  Using the following variables,
2651
2652              | i0 = u11 * gamma / gcd_alpha_beta
2653              | j0 = u12 * gamma / gcd_alpha_beta
2654              | i1 = u21
2655              | j1 = u22
2656
2657              the solutions are:
2658
2659              | x0 = i0 + i1 * t,
2660              | y0 = j0 + j1 * t.  */
2661           HOST_WIDE_INT i0, j0, i1, j1;
2662
2663           i0 = U[0][0] * gamma / gcd_alpha_beta;
2664           j0 = U[0][1] * gamma / gcd_alpha_beta;
2665           i1 = U[1][0];
2666           j1 = U[1][1];
2667
2668           if ((i1 == 0 && i0 < 0)
2669               || (j1 == 0 && j0 < 0))
2670             {
2671               /* There is no solution.
2672                  FIXME: The case "i0 > nb_iterations, j0 > nb_iterations"
2673                  falls in here, but for the moment we don't look at the
2674                  upper bound of the iteration domain.  */
2675               *overlaps_a = conflict_fn_no_dependence ();
2676               *overlaps_b = conflict_fn_no_dependence ();
2677               *last_conflicts = integer_zero_node;
2678               goto end_analyze_subs_aa;
2679             }
2680
2681           if (i1 > 0 && j1 > 0)
2682             {
2683               HOST_WIDE_INT niter_a
2684                 = max_stmt_executions_int (get_chrec_loop (chrec_a));
2685               HOST_WIDE_INT niter_b
2686                 = max_stmt_executions_int (get_chrec_loop (chrec_b));
2687               HOST_WIDE_INT niter = MIN (niter_a, niter_b);
2688
2689               /* (X0, Y0) is a solution of the Diophantine equation:
2690                  "chrec_a (X0) = chrec_b (Y0)".  */
2691               HOST_WIDE_INT tau1 = MAX (CEIL (-i0, i1),
2692                                         CEIL (-j0, j1));
2693               HOST_WIDE_INT x0 = i1 * tau1 + i0;
2694               HOST_WIDE_INT y0 = j1 * tau1 + j0;
2695
2696               /* (X1, Y1) is the smallest positive solution of the eq
2697                  "chrec_a (X1) = chrec_b (Y1)", i.e. this is where the
2698                  first conflict occurs.  */
2699               HOST_WIDE_INT min_multiple = MIN (x0 / i1, y0 / j1);
2700               HOST_WIDE_INT x1 = x0 - i1 * min_multiple;
2701               HOST_WIDE_INT y1 = y0 - j1 * min_multiple;
2702
2703               if (niter > 0)
2704                 {
2705                   HOST_WIDE_INT tau2 = MIN (FLOOR_DIV (niter - i0, i1),
2706                                             FLOOR_DIV (niter - j0, j1));
2707                   HOST_WIDE_INT last_conflict = tau2 - (x1 - i0)/i1;
2708
2709                   /* If the overlap occurs outside of the bounds of the
2710                      loop, there is no dependence.  */
2711                   if (x1 >= niter || y1 >= niter)
2712                     {
2713                       *overlaps_a = conflict_fn_no_dependence ();
2714                       *overlaps_b = conflict_fn_no_dependence ();
2715                       *last_conflicts = integer_zero_node;
2716                       goto end_analyze_subs_aa;
2717                     }
2718                   else
2719                     *last_conflicts = build_int_cst (NULL_TREE, last_conflict);
2720                 }
2721               else
2722                 *last_conflicts = chrec_dont_know;
2723
2724               *overlaps_a
2725                 = conflict_fn (1,
2726                                affine_fn_univar (build_int_cst (NULL_TREE, x1),
2727                                                  1,
2728                                                  build_int_cst (NULL_TREE, i1)));
2729               *overlaps_b
2730                 = conflict_fn (1,
2731                                affine_fn_univar (build_int_cst (NULL_TREE, y1),
2732                                                  1,
2733                                                  build_int_cst (NULL_TREE, j1)));
2734             }
2735           else
2736             {
2737               /* FIXME: For the moment, the upper bound of the
2738                  iteration domain for i and j is not checked.  */
2739               if (dump_file && (dump_flags & TDF_DETAILS))
2740                 fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2741               *overlaps_a = conflict_fn_not_known ();
2742               *overlaps_b = conflict_fn_not_known ();
2743               *last_conflicts = chrec_dont_know;
2744             }
2745         }
2746       else
2747         {
2748           if (dump_file && (dump_flags & TDF_DETAILS))
2749             fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2750           *overlaps_a = conflict_fn_not_known ();
2751           *overlaps_b = conflict_fn_not_known ();
2752           *last_conflicts = chrec_dont_know;
2753         }
2754     }
2755   else
2756     {
2757       if (dump_file && (dump_flags & TDF_DETAILS))
2758         fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2759       *overlaps_a = conflict_fn_not_known ();
2760       *overlaps_b = conflict_fn_not_known ();
2761       *last_conflicts = chrec_dont_know;
2762     }
2763
2764 end_analyze_subs_aa:
2765   obstack_free (&scratch_obstack, NULL);
2766   if (dump_file && (dump_flags & TDF_DETAILS))
2767     {
2768       fprintf (dump_file, "  (overlaps_a = ");
2769       dump_conflict_function (dump_file, *overlaps_a);
2770       fprintf (dump_file, ")\n  (overlaps_b = ");
2771       dump_conflict_function (dump_file, *overlaps_b);
2772       fprintf (dump_file, "))\n");
2773     }
2774 }
2775
2776 /* Returns true when analyze_subscript_affine_affine can be used for
2777    determining the dependence relation between chrec_a and chrec_b,
2778    that contain symbols.  This function modifies chrec_a and chrec_b
2779    such that the analysis result is the same, and such that they don't
2780    contain symbols, and then can safely be passed to the analyzer.
2781
2782    Example: The analysis of the following tuples of evolutions produce
2783    the same results: {x+1, +, 1}_1 vs. {x+3, +, 1}_1, and {-2, +, 1}_1
2784    vs. {0, +, 1}_1
2785
2786    {x+1, +, 1}_1 ({2, +, 1}_1) = {x+3, +, 1}_1 ({0, +, 1}_1)
2787    {-2, +, 1}_1 ({2, +, 1}_1) = {0, +, 1}_1 ({0, +, 1}_1)
2788 */
2789
2790 static bool
2791 can_use_analyze_subscript_affine_affine (tree *chrec_a, tree *chrec_b)
2792 {
2793   tree diff, type, left_a, left_b, right_b;
2794
2795   if (chrec_contains_symbols (CHREC_RIGHT (*chrec_a))
2796       || chrec_contains_symbols (CHREC_RIGHT (*chrec_b)))
2797     /* FIXME: For the moment not handled.  Might be refined later.  */
2798     return false;
2799
2800   type = chrec_type (*chrec_a);
2801   left_a = CHREC_LEFT (*chrec_a);
2802   left_b = chrec_convert (type, CHREC_LEFT (*chrec_b), NULL);
2803   diff = chrec_fold_minus (type, left_a, left_b);
2804
2805   if (!evolution_function_is_constant_p (diff))
2806     return false;
2807
2808   if (dump_file && (dump_flags & TDF_DETAILS))
2809     fprintf (dump_file, "can_use_subscript_aff_aff_for_symbolic \n");
2810
2811   *chrec_a = build_polynomial_chrec (CHREC_VARIABLE (*chrec_a),
2812                                      diff, CHREC_RIGHT (*chrec_a));
2813   right_b = chrec_convert (type, CHREC_RIGHT (*chrec_b), NULL);
2814   *chrec_b = build_polynomial_chrec (CHREC_VARIABLE (*chrec_b),
2815                                      build_int_cst (type, 0),
2816                                      right_b);
2817   return true;
2818 }
2819
2820 /* Analyze a SIV (Single Index Variable) subscript.  *OVERLAPS_A and
2821    *OVERLAPS_B are initialized to the functions that describe the
2822    relation between the elements accessed twice by CHREC_A and
2823    CHREC_B.  For k >= 0, the following property is verified:
2824
2825    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
2826
2827 static void
2828 analyze_siv_subscript (tree chrec_a,
2829                        tree chrec_b,
2830                        conflict_function **overlaps_a,
2831                        conflict_function **overlaps_b,
2832                        tree *last_conflicts,
2833                        int loop_nest_num)
2834 {
2835   dependence_stats.num_siv++;
2836
2837   if (dump_file && (dump_flags & TDF_DETAILS))
2838     fprintf (dump_file, "(analyze_siv_subscript \n");
2839
2840   if (evolution_function_is_constant_p (chrec_a)
2841       && evolution_function_is_affine_in_loop (chrec_b, loop_nest_num))
2842     analyze_siv_subscript_cst_affine (chrec_a, chrec_b,
2843                                       overlaps_a, overlaps_b, last_conflicts);
2844
2845   else if (evolution_function_is_affine_in_loop (chrec_a, loop_nest_num)
2846            && evolution_function_is_constant_p (chrec_b))
2847     analyze_siv_subscript_cst_affine (chrec_b, chrec_a,
2848                                       overlaps_b, overlaps_a, last_conflicts);
2849
2850   else if (evolution_function_is_affine_in_loop (chrec_a, loop_nest_num)
2851            && evolution_function_is_affine_in_loop (chrec_b, loop_nest_num))
2852     {
2853       if (!chrec_contains_symbols (chrec_a)
2854           && !chrec_contains_symbols (chrec_b))
2855         {
2856           analyze_subscript_affine_affine (chrec_a, chrec_b,
2857                                            overlaps_a, overlaps_b,
2858                                            last_conflicts);
2859
2860           if (CF_NOT_KNOWN_P (*overlaps_a)
2861               || CF_NOT_KNOWN_P (*overlaps_b))
2862             dependence_stats.num_siv_unimplemented++;
2863           else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2864                    || CF_NO_DEPENDENCE_P (*overlaps_b))
2865             dependence_stats.num_siv_independent++;
2866           else
2867             dependence_stats.num_siv_dependent++;
2868         }
2869       else if (can_use_analyze_subscript_affine_affine (&chrec_a,
2870                                                         &chrec_b))
2871         {
2872           analyze_subscript_affine_affine (chrec_a, chrec_b,
2873                                            overlaps_a, overlaps_b,
2874                                            last_conflicts);
2875
2876           if (CF_NOT_KNOWN_P (*overlaps_a)
2877               || CF_NOT_KNOWN_P (*overlaps_b))
2878             dependence_stats.num_siv_unimplemented++;
2879           else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2880                    || CF_NO_DEPENDENCE_P (*overlaps_b))
2881             dependence_stats.num_siv_independent++;
2882           else
2883             dependence_stats.num_siv_dependent++;
2884         }
2885       else
2886         goto siv_subscript_dontknow;
2887     }
2888
2889   else
2890     {
2891     siv_subscript_dontknow:;
2892       if (dump_file && (dump_flags & TDF_DETAILS))
2893         fprintf (dump_file, "  siv test failed: unimplemented");
2894       *overlaps_a = conflict_fn_not_known ();
2895       *overlaps_b = conflict_fn_not_known ();
2896       *last_conflicts = chrec_dont_know;
2897       dependence_stats.num_siv_unimplemented++;
2898     }
2899
2900   if (dump_file && (dump_flags & TDF_DETAILS))
2901     fprintf (dump_file, ")\n");
2902 }
2903
2904 /* Returns false if we can prove that the greatest common divisor of the steps
2905    of CHREC does not divide CST, false otherwise.  */
2906
2907 static bool
2908 gcd_of_steps_may_divide_p (const_tree chrec, const_tree cst)
2909 {
2910   HOST_WIDE_INT cd = 0, val;
2911   tree step;
2912
2913   if (!tree_fits_shwi_p (cst))
2914     return true;
2915   val = tree_to_shwi (cst);
2916
2917   while (TREE_CODE (chrec) == POLYNOMIAL_CHREC)
2918     {
2919       step = CHREC_RIGHT (chrec);
2920       if (!tree_fits_shwi_p (step))
2921         return true;
2922       cd = gcd (cd, tree_to_shwi (step));
2923       chrec = CHREC_LEFT (chrec);
2924     }
2925
2926   return val % cd == 0;
2927 }
2928
2929 /* Analyze a MIV (Multiple Index Variable) subscript with respect to
2930    LOOP_NEST.  *OVERLAPS_A and *OVERLAPS_B are initialized to the
2931    functions that describe the relation between the elements accessed
2932    twice by CHREC_A and CHREC_B.  For k >= 0, the following property
2933    is verified:
2934
2935    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
2936
2937 static void
2938 analyze_miv_subscript (tree chrec_a,
2939                        tree chrec_b,
2940                        conflict_function **overlaps_a,
2941                        conflict_function **overlaps_b,
2942                        tree *last_conflicts,
2943                        struct loop *loop_nest)
2944 {
2945   tree type, difference;
2946
2947   dependence_stats.num_miv++;
2948   if (dump_file && (dump_flags & TDF_DETAILS))
2949     fprintf (dump_file, "(analyze_miv_subscript \n");
2950
2951   type = signed_type_for_types (TREE_TYPE (chrec_a), TREE_TYPE (chrec_b));
2952   chrec_a = chrec_convert (type, chrec_a, NULL);
2953   chrec_b = chrec_convert (type, chrec_b, NULL);
2954   difference = chrec_fold_minus (type, chrec_a, chrec_b);
2955
2956   if (eq_evolutions_p (chrec_a, chrec_b))
2957     {
2958       /* Access functions are the same: all the elements are accessed
2959          in the same order.  */
2960       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2961       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2962       *last_conflicts = max_stmt_executions_tree (get_chrec_loop (chrec_a));
2963       dependence_stats.num_miv_dependent++;
2964     }
2965
2966   else if (evolution_function_is_constant_p (difference)
2967            /* For the moment, the following is verified:
2968               evolution_function_is_affine_multivariate_p (chrec_a,
2969               loop_nest->num) */
2970            && !gcd_of_steps_may_divide_p (chrec_a, difference))
2971     {
2972       /* testsuite/.../ssa-chrec-33.c
2973          {{21, +, 2}_1, +, -2}_2  vs.  {{20, +, 2}_1, +, -2}_2
2974
2975          The difference is 1, and all the evolution steps are multiples
2976          of 2, consequently there are no overlapping elements.  */
2977       *overlaps_a = conflict_fn_no_dependence ();
2978       *overlaps_b = conflict_fn_no_dependence ();
2979       *last_conflicts = integer_zero_node;
2980       dependence_stats.num_miv_independent++;
2981     }
2982
2983   else if (evolution_function_is_affine_multivariate_p (chrec_a, loop_nest->num)
2984            && !chrec_contains_symbols (chrec_a)
2985            && evolution_function_is_affine_multivariate_p (chrec_b, loop_nest->num)
2986            && !chrec_contains_symbols (chrec_b))
2987     {
2988       /* testsuite/.../ssa-chrec-35.c
2989          {0, +, 1}_2  vs.  {0, +, 1}_3
2990          the overlapping elements are respectively located at iterations:
2991          {0, +, 1}_x and {0, +, 1}_x,
2992          in other words, we have the equality:
2993          {0, +, 1}_2 ({0, +, 1}_x) = {0, +, 1}_3 ({0, +, 1}_x)
2994
2995          Other examples:
2996          {{0, +, 1}_1, +, 2}_2 ({0, +, 1}_x, {0, +, 1}_y) =
2997          {0, +, 1}_1 ({{0, +, 1}_x, +, 2}_y)
2998
2999          {{0, +, 2}_1, +, 3}_2 ({0, +, 1}_y, {0, +, 1}_x) =
3000          {{0, +, 3}_1, +, 2}_2 ({0, +, 1}_x, {0, +, 1}_y)
3001       */
3002       analyze_subscript_affine_affine (chrec_a, chrec_b,
3003                                        overlaps_a, overlaps_b, last_conflicts);
3004
3005       if (CF_NOT_KNOWN_P (*overlaps_a)
3006           || CF_NOT_KNOWN_P (*overlaps_b))
3007         dependence_stats.num_miv_unimplemented++;
3008       else if (CF_NO_DEPENDENCE_P (*overlaps_a)
3009                || CF_NO_DEPENDENCE_P (*overlaps_b))
3010         dependence_stats.num_miv_independent++;
3011       else
3012         dependence_stats.num_miv_dependent++;
3013     }
3014
3015   else
3016     {
3017       /* When the analysis is too difficult, answer "don't know".  */
3018       if (dump_file && (dump_flags & TDF_DETAILS))
3019         fprintf (dump_file, "analyze_miv_subscript test failed: unimplemented.\n");
3020
3021       *overlaps_a = conflict_fn_not_known ();
3022       *overlaps_b = conflict_fn_not_known ();
3023       *last_conflicts = chrec_dont_know;
3024       dependence_stats.num_miv_unimplemented++;
3025     }
3026
3027   if (dump_file && (dump_flags & TDF_DETAILS))
3028     fprintf (dump_file, ")\n");
3029 }
3030
3031 /* Determines the iterations for which CHREC_A is equal to CHREC_B in
3032    with respect to LOOP_NEST.  OVERLAP_ITERATIONS_A and
3033    OVERLAP_ITERATIONS_B are initialized with two functions that
3034    describe the iterations that contain conflicting elements.
3035
3036    Remark: For an integer k >= 0, the following equality is true:
3037
3038    CHREC_A (OVERLAP_ITERATIONS_A (k)) == CHREC_B (OVERLAP_ITERATIONS_B (k)).
3039 */
3040
3041 static void
3042 analyze_overlapping_iterations (tree chrec_a,
3043                                 tree chrec_b,
3044                                 conflict_function **overlap_iterations_a,
3045                                 conflict_function **overlap_iterations_b,
3046                                 tree *last_conflicts, struct loop *loop_nest)
3047 {
3048   unsigned int lnn = loop_nest->num;
3049
3050   dependence_stats.num_subscript_tests++;
3051
3052   if (dump_file && (dump_flags & TDF_DETAILS))
3053     {
3054       fprintf (dump_file, "(analyze_overlapping_iterations \n");
3055       fprintf (dump_file, "  (chrec_a = ");
3056       print_generic_expr (dump_file, chrec_a, 0);
3057       fprintf (dump_file, ")\n  (chrec_b = ");
3058       print_generic_expr (dump_file, chrec_b, 0);
3059       fprintf (dump_file, ")\n");
3060     }
3061
3062   if (chrec_a == NULL_TREE
3063       || chrec_b == NULL_TREE
3064       || chrec_contains_undetermined (chrec_a)
3065       || chrec_contains_undetermined (chrec_b))
3066     {
3067       dependence_stats.num_subscript_undetermined++;
3068
3069       *overlap_iterations_a = conflict_fn_not_known ();
3070       *overlap_iterations_b = conflict_fn_not_known ();
3071     }
3072
3073   /* If they are the same chrec, and are affine, they overlap
3074      on every iteration.  */
3075   else if (eq_evolutions_p (chrec_a, chrec_b)
3076            && (evolution_function_is_affine_multivariate_p (chrec_a, lnn)
3077                || operand_equal_p (chrec_a, chrec_b, 0)))
3078     {
3079       dependence_stats.num_same_subscript_function++;
3080       *overlap_iterations_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
3081       *overlap_iterations_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
3082       *last_conflicts = chrec_dont_know;
3083     }
3084
3085   /* If they aren't the same, and aren't affine, we can't do anything
3086      yet.  */
3087   else if ((chrec_contains_symbols (chrec_a)
3088             || chrec_contains_symbols (chrec_b))
3089            && (!evolution_function_is_affine_multivariate_p (chrec_a, lnn)
3090                || !evolution_function_is_affine_multivariate_p (chrec_b, lnn)))
3091     {
3092       dependence_stats.num_subscript_undetermined++;
3093       *overlap_iterations_a = conflict_fn_not_known ();
3094       *overlap_iterations_b = conflict_fn_not_known ();
3095     }
3096
3097   else if (ziv_subscript_p (chrec_a, chrec_b))
3098     analyze_ziv_subscript (chrec_a, chrec_b,
3099                            overlap_iterations_a, overlap_iterations_b,
3100                            last_conflicts);
3101
3102   else if (siv_subscript_p (chrec_a, chrec_b))
3103     analyze_siv_subscript (chrec_a, chrec_b,
3104                            overlap_iterations_a, overlap_iterations_b,
3105                            last_conflicts, lnn);
3106
3107   else
3108     analyze_miv_subscript (chrec_a, chrec_b,
3109                            overlap_iterations_a, overlap_iterations_b,
3110                            last_conflicts, loop_nest);
3111
3112   if (dump_file && (dump_flags & TDF_DETAILS))
3113     {
3114       fprintf (dump_file, "  (overlap_iterations_a = ");
3115       dump_conflict_function (dump_file, *overlap_iterations_a);
3116       fprintf (dump_file, ")\n  (overlap_iterations_b = ");
3117       dump_conflict_function (dump_file, *overlap_iterations_b);
3118       fprintf (dump_file, "))\n");
3119     }
3120 }
3121
3122 /* Helper function for uniquely inserting distance vectors.  */
3123
3124 static void
3125 save_dist_v (struct data_dependence_relation *ddr, lambda_vector dist_v)
3126 {
3127   unsigned i;
3128   lambda_vector v;
3129
3130   FOR_EACH_VEC_ELT (DDR_DIST_VECTS (ddr), i, v)
3131     if (lambda_vector_equal (v, dist_v, DDR_NB_LOOPS (ddr)))
3132       return;
3133
3134   DDR_DIST_VECTS (ddr).safe_push (dist_v);
3135 }
3136
3137 /* Helper function for uniquely inserting direction vectors.  */
3138
3139 static void
3140 save_dir_v (struct data_dependence_relation *ddr, lambda_vector dir_v)
3141 {
3142   unsigned i;
3143   lambda_vector v;
3144
3145   FOR_EACH_VEC_ELT (DDR_DIR_VECTS (ddr), i, v)
3146     if (lambda_vector_equal (v, dir_v, DDR_NB_LOOPS (ddr)))
3147       return;
3148
3149   DDR_DIR_VECTS (ddr).safe_push (dir_v);
3150 }
3151
3152 /* Add a distance of 1 on all the loops outer than INDEX.  If we
3153    haven't yet determined a distance for this outer loop, push a new
3154    distance vector composed of the previous distance, and a distance
3155    of 1 for this outer loop.  Example:
3156
3157    | loop_1
3158    |   loop_2
3159    |     A[10]
3160    |   endloop_2
3161    | endloop_1
3162
3163    Saved vectors are of the form (dist_in_1, dist_in_2).  First, we
3164    save (0, 1), then we have to save (1, 0).  */
3165
3166 static void
3167 add_outer_distances (struct data_dependence_relation *ddr,
3168                      lambda_vector dist_v, int index)
3169 {
3170   /* For each outer loop where init_v is not set, the accesses are
3171      in dependence of distance 1 in the loop.  */
3172   while (--index >= 0)
3173     {
3174       lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3175       lambda_vector_copy (dist_v, save_v, DDR_NB_LOOPS (ddr));
3176       save_v[index] = 1;
3177       save_dist_v (ddr, save_v);
3178     }
3179 }
3180
3181 /* Return false when fail to represent the data dependence as a
3182    distance vector.  INIT_B is set to true when a component has been
3183    added to the distance vector DIST_V.  INDEX_CARRY is then set to
3184    the index in DIST_V that carries the dependence.  */
3185
3186 static bool
3187 build_classic_dist_vector_1 (struct data_dependence_relation *ddr,
3188                              struct data_reference *ddr_a,
3189                              struct data_reference *ddr_b,
3190                              lambda_vector dist_v, bool *init_b,
3191                              int *index_carry)
3192 {
3193   unsigned i;
3194   lambda_vector init_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3195
3196   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3197     {
3198       tree access_fn_a, access_fn_b;
3199       struct subscript *subscript = DDR_SUBSCRIPT (ddr, i);
3200
3201       if (chrec_contains_undetermined (SUB_DISTANCE (subscript)))
3202         {
3203           non_affine_dependence_relation (ddr);
3204           return false;
3205         }
3206
3207       access_fn_a = DR_ACCESS_FN (ddr_a, i);
3208       access_fn_b = DR_ACCESS_FN (ddr_b, i);
3209
3210       if (TREE_CODE (access_fn_a) == POLYNOMIAL_CHREC
3211           && TREE_CODE (access_fn_b) == POLYNOMIAL_CHREC)
3212         {
3213           int dist, index;
3214           int var_a = CHREC_VARIABLE (access_fn_a);
3215           int var_b = CHREC_VARIABLE (access_fn_b);
3216
3217           if (var_a != var_b
3218               || chrec_contains_undetermined (SUB_DISTANCE (subscript)))
3219             {
3220               non_affine_dependence_relation (ddr);
3221               return false;
3222             }
3223
3224           dist = int_cst_value (SUB_DISTANCE (subscript));
3225           index = index_in_loop_nest (var_a, DDR_LOOP_NEST (ddr));
3226           *index_carry = MIN (index, *index_carry);
3227
3228           /* This is the subscript coupling test.  If we have already
3229              recorded a distance for this loop (a distance coming from
3230              another subscript), it should be the same.  For example,
3231              in the following code, there is no dependence:
3232
3233              | loop i = 0, N, 1
3234              |   T[i+1][i] = ...
3235              |   ... = T[i][i]
3236              | endloop
3237           */
3238           if (init_v[index] != 0 && dist_v[index] != dist)
3239             {
3240               finalize_ddr_dependent (ddr, chrec_known);
3241               return false;
3242             }
3243
3244           dist_v[index] = dist;
3245           init_v[index] = 1;
3246           *init_b = true;
3247         }
3248       else if (!operand_equal_p (access_fn_a, access_fn_b, 0))
3249         {
3250           /* This can be for example an affine vs. constant dependence
3251              (T[i] vs. T[3]) that is not an affine dependence and is
3252              not representable as a distance vector.  */
3253           non_affine_dependence_relation (ddr);
3254           return false;
3255         }
3256     }
3257
3258   return true;
3259 }
3260
3261 /* Return true when the DDR contains only constant access functions.  */
3262
3263 static bool
3264 constant_access_functions (const struct data_dependence_relation *ddr)
3265 {
3266   unsigned i;
3267
3268   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3269     if (!evolution_function_is_constant_p (DR_ACCESS_FN (DDR_A (ddr), i))
3270         || !evolution_function_is_constant_p (DR_ACCESS_FN (DDR_B (ddr), i)))
3271       return false;
3272
3273   return true;
3274 }
3275
3276 /* Helper function for the case where DDR_A and DDR_B are the same
3277    multivariate access function with a constant step.  For an example
3278    see pr34635-1.c.  */
3279
3280 static void
3281 add_multivariate_self_dist (struct data_dependence_relation *ddr, tree c_2)
3282 {
3283   int x_1, x_2;
3284   tree c_1 = CHREC_LEFT (c_2);
3285   tree c_0 = CHREC_LEFT (c_1);
3286   lambda_vector dist_v;
3287   int v1, v2, cd;
3288
3289   /* Polynomials with more than 2 variables are not handled yet.  When
3290      the evolution steps are parameters, it is not possible to
3291      represent the dependence using classical distance vectors.  */
3292   if (TREE_CODE (c_0) != INTEGER_CST
3293       || TREE_CODE (CHREC_RIGHT (c_1)) != INTEGER_CST
3294       || TREE_CODE (CHREC_RIGHT (c_2)) != INTEGER_CST)
3295     {
3296       DDR_AFFINE_P (ddr) = false;
3297       return;
3298     }
3299
3300   x_2 = index_in_loop_nest (CHREC_VARIABLE (c_2), DDR_LOOP_NEST (ddr));
3301   x_1 = index_in_loop_nest (CHREC_VARIABLE (c_1), DDR_LOOP_NEST (ddr));
3302
3303   /* For "{{0, +, 2}_1, +, 3}_2" the distance vector is (3, -2).  */
3304   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3305   v1 = int_cst_value (CHREC_RIGHT (c_1));
3306   v2 = int_cst_value (CHREC_RIGHT (c_2));
3307   cd = gcd (v1, v2);
3308   v1 /= cd;
3309   v2 /= cd;
3310
3311   if (v2 < 0)
3312     {
3313       v2 = -v2;
3314       v1 = -v1;
3315     }
3316
3317   dist_v[x_1] = v2;
3318   dist_v[x_2] = -v1;
3319   save_dist_v (ddr, dist_v);
3320
3321   add_outer_distances (ddr, dist_v, x_1);
3322 }
3323
3324 /* Helper function for the case where DDR_A and DDR_B are the same
3325    access functions.  */
3326
3327 static void
3328 add_other_self_distances (struct data_dependence_relation *ddr)
3329 {
3330   lambda_vector dist_v;
3331   unsigned i;
3332   int index_carry = DDR_NB_LOOPS (ddr);
3333
3334   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3335     {
3336       tree access_fun = DR_ACCESS_FN (DDR_A (ddr), i);
3337
3338       if (TREE_CODE (access_fun) == POLYNOMIAL_CHREC)
3339         {
3340           if (!evolution_function_is_univariate_p (access_fun))
3341             {
3342               if (DDR_NUM_SUBSCRIPTS (ddr) != 1)
3343                 {
3344                   DDR_ARE_DEPENDENT (ddr) = chrec_dont_know;
3345                   return;
3346                 }
3347
3348               access_fun = DR_ACCESS_FN (DDR_A (ddr), 0);
3349
3350               if (TREE_CODE (CHREC_LEFT (access_fun)) == POLYNOMIAL_CHREC)
3351                 add_multivariate_self_dist (ddr, access_fun);
3352               else
3353                 /* The evolution step is not constant: it varies in
3354                    the outer loop, so this cannot be represented by a
3355                    distance vector.  For example in pr34635.c the
3356                    evolution is {0, +, {0, +, 4}_1}_2.  */
3357                 DDR_AFFINE_P (ddr) = false;
3358
3359               return;
3360             }
3361
3362           index_carry = MIN (index_carry,
3363                              index_in_loop_nest (CHREC_VARIABLE (access_fun),
3364                                                  DDR_LOOP_NEST (ddr)));
3365         }
3366     }
3367
3368   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3369   add_outer_distances (ddr, dist_v, index_carry);
3370 }
3371
3372 static void
3373 insert_innermost_unit_dist_vector (struct data_dependence_relation *ddr)
3374 {
3375   lambda_vector dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3376
3377   dist_v[DDR_INNER_LOOP (ddr)] = 1;
3378   save_dist_v (ddr, dist_v);
3379 }
3380
3381 /* Adds a unit distance vector to DDR when there is a 0 overlap.  This
3382    is the case for example when access functions are the same and
3383    equal to a constant, as in:
3384
3385    | loop_1
3386    |   A[3] = ...
3387    |   ... = A[3]
3388    | endloop_1
3389
3390    in which case the distance vectors are (0) and (1).  */
3391
3392 static void
3393 add_distance_for_zero_overlaps (struct data_dependence_relation *ddr)
3394 {
3395   unsigned i, j;
3396
3397   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3398     {
3399       subscript_p sub = DDR_SUBSCRIPT (ddr, i);
3400       conflict_function *ca = SUB_CONFLICTS_IN_A (sub);
3401       conflict_function *cb = SUB_CONFLICTS_IN_B (sub);
3402
3403       for (j = 0; j < ca->n; j++)
3404         if (affine_function_zero_p (ca->fns[j]))
3405           {
3406             insert_innermost_unit_dist_vector (ddr);
3407             return;
3408           }
3409
3410       for (j = 0; j < cb->n; j++)
3411         if (affine_function_zero_p (cb->fns[j]))
3412           {
3413             insert_innermost_unit_dist_vector (ddr);
3414             return;
3415           }
3416     }
3417 }
3418
3419 /* Compute the classic per loop distance vector.  DDR is the data
3420    dependence relation to build a vector from.  Return false when fail
3421    to represent the data dependence as a distance vector.  */
3422
3423 static bool
3424 build_classic_dist_vector (struct data_dependence_relation *ddr,
3425                            struct loop *loop_nest)
3426 {
3427   bool init_b = false;
3428   int index_carry = DDR_NB_LOOPS (ddr);
3429   lambda_vector dist_v;
3430
3431   if (DDR_ARE_DEPENDENT (ddr) != NULL_TREE)
3432     return false;
3433
3434   if (same_access_functions (ddr))
3435     {
3436       /* Save the 0 vector.  */
3437       dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3438       save_dist_v (ddr, dist_v);
3439
3440       if (constant_access_functions (ddr))
3441         add_distance_for_zero_overlaps (ddr);
3442
3443       if (DDR_NB_LOOPS (ddr) > 1)
3444         add_other_self_distances (ddr);
3445
3446       return true;
3447     }
3448
3449   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3450   if (!build_classic_dist_vector_1 (ddr, DDR_A (ddr), DDR_B (ddr),
3451                                     dist_v, &init_b, &index_carry))
3452     return false;
3453
3454   /* Save the distance vector if we initialized one.  */
3455   if (init_b)
3456     {
3457       /* Verify a basic constraint: classic distance vectors should
3458          always be lexicographically positive.
3459
3460          Data references are collected in the order of execution of
3461          the program, thus for the following loop
3462
3463          | for (i = 1; i < 100; i++)
3464          |   for (j = 1; j < 100; j++)
3465          |     {
3466          |       t = T[j+1][i-1];  // A
3467          |       T[j][i] = t + 2;  // B
3468          |     }
3469
3470          references are collected following the direction of the wind:
3471          A then B.  The data dependence tests are performed also
3472          following this order, such that we're looking at the distance
3473          separating the elements accessed by A from the elements later
3474          accessed by B.  But in this example, the distance returned by
3475          test_dep (A, B) is lexicographically negative (-1, 1), that
3476          means that the access A occurs later than B with respect to
3477          the outer loop, ie. we're actually looking upwind.  In this
3478          case we solve test_dep (B, A) looking downwind to the
3479          lexicographically positive solution, that returns the
3480          distance vector (1, -1).  */
3481       if (!lambda_vector_lexico_pos (dist_v, DDR_NB_LOOPS (ddr)))
3482         {
3483           lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3484           if (!subscript_dependence_tester_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3485                                               loop_nest))
3486             return false;
3487           compute_subscript_distance (ddr);
3488           if (!build_classic_dist_vector_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3489                                             save_v, &init_b, &index_carry))
3490             return false;
3491           save_dist_v (ddr, save_v);
3492           DDR_REVERSED_P (ddr) = true;
3493
3494           /* In this case there is a dependence forward for all the
3495              outer loops:
3496
3497              | for (k = 1; k < 100; k++)
3498              |  for (i = 1; i < 100; i++)
3499              |   for (j = 1; j < 100; j++)
3500              |     {
3501              |       t = T[j+1][i-1];  // A
3502              |       T[j][i] = t + 2;  // B
3503              |     }
3504
3505              the vectors are:
3506              (0,  1, -1)
3507              (1,  1, -1)
3508              (1, -1,  1)
3509           */
3510           if (DDR_NB_LOOPS (ddr) > 1)
3511             {
3512               add_outer_distances (ddr, save_v, index_carry);
3513               add_outer_distances (ddr, dist_v, index_carry);
3514             }
3515         }
3516       else
3517         {
3518           lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3519           lambda_vector_copy (dist_v, save_v, DDR_NB_LOOPS (ddr));
3520
3521           if (DDR_NB_LOOPS (ddr) > 1)
3522             {
3523               lambda_vector opposite_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3524
3525               if (!subscript_dependence_tester_1 (ddr, DDR_B (ddr),
3526                                                   DDR_A (ddr), loop_nest))
3527                 return false;
3528               compute_subscript_distance (ddr);
3529               if (!build_classic_dist_vector_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3530                                                 opposite_v, &init_b,
3531                                                 &index_carry))
3532                 return false;
3533
3534               save_dist_v (ddr, save_v);
3535               add_outer_distances (ddr, dist_v, index_carry);
3536               add_outer_distances (ddr, opposite_v, index_carry);
3537             }
3538           else
3539             save_dist_v (ddr, save_v);
3540         }
3541     }
3542   else
3543     {
3544       /* There is a distance of 1 on all the outer loops: Example:
3545          there is a dependence of distance 1 on loop_1 for the array A.
3546
3547          | loop_1
3548          |   A[5] = ...
3549          | endloop
3550       */
3551       add_outer_distances (ddr, dist_v,
3552                            lambda_vector_first_nz (dist_v,
3553                                                    DDR_NB_LOOPS (ddr), 0));
3554     }
3555
3556   if (dump_file && (dump_flags & TDF_DETAILS))
3557     {
3558       unsigned i;
3559
3560       fprintf (dump_file, "(build_classic_dist_vector\n");
3561       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
3562         {
3563           fprintf (dump_file, "  dist_vector = (");
3564           print_lambda_vector (dump_file, DDR_DIST_VECT (ddr, i),
3565                                DDR_NB_LOOPS (ddr));
3566           fprintf (dump_file, "  )\n");
3567         }
3568       fprintf (dump_file, ")\n");
3569     }
3570
3571   return true;
3572 }
3573
3574 /* Return the direction for a given distance.
3575    FIXME: Computing dir this way is suboptimal, since dir can catch
3576    cases that dist is unable to represent.  */
3577
3578 static inline enum data_dependence_direction
3579 dir_from_dist (int dist)
3580 {
3581   if (dist > 0)
3582     return dir_positive;
3583   else if (dist < 0)
3584     return dir_negative;
3585   else
3586     return dir_equal;
3587 }
3588
3589 /* Compute the classic per loop direction vector.  DDR is the data
3590    dependence relation to build a vector from.  */
3591
3592 static void
3593 build_classic_dir_vector (struct data_dependence_relation *ddr)
3594 {
3595   unsigned i, j;
3596   lambda_vector dist_v;
3597
3598   FOR_EACH_VEC_ELT (DDR_DIST_VECTS (ddr), i, dist_v)
3599     {
3600       lambda_vector dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3601
3602       for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
3603         dir_v[j] = dir_from_dist (dist_v[j]);
3604
3605       save_dir_v (ddr, dir_v);
3606     }
3607 }
3608
3609 /* Helper function.  Returns true when there is a dependence between
3610    data references DRA and DRB.  */
3611
3612 static bool
3613 subscript_dependence_tester_1 (struct data_dependence_relation *ddr,
3614                                struct data_reference *dra,
3615                                struct data_reference *drb,
3616                                struct loop *loop_nest)
3617 {
3618   unsigned int i;
3619   tree last_conflicts;
3620   struct subscript *subscript;
3621   tree res = NULL_TREE;
3622
3623   for (i = 0; DDR_SUBSCRIPTS (ddr).iterate (i, &subscript); i++)
3624     {
3625       conflict_function *overlaps_a, *overlaps_b;
3626
3627       analyze_overlapping_iterations (DR_ACCESS_FN (dra, i),
3628                                       DR_ACCESS_FN (drb, i),
3629                                       &overlaps_a, &overlaps_b,
3630                                       &last_conflicts, loop_nest);
3631
3632       if (SUB_CONFLICTS_IN_A (subscript))
3633         free_conflict_function (SUB_CONFLICTS_IN_A (subscript));
3634       if (SUB_CONFLICTS_IN_B (subscript))
3635         free_conflict_function (SUB_CONFLICTS_IN_B (subscript));
3636
3637       SUB_CONFLICTS_IN_A (subscript) = overlaps_a;
3638       SUB_CONFLICTS_IN_B (subscript) = overlaps_b;
3639       SUB_LAST_CONFLICT (subscript) = last_conflicts;
3640
3641       /* If there is any undetermined conflict function we have to
3642          give a conservative answer in case we cannot prove that
3643          no dependence exists when analyzing another subscript.  */
3644       if (CF_NOT_KNOWN_P (overlaps_a)
3645           || CF_NOT_KNOWN_P (overlaps_b))
3646         {
3647           res = chrec_dont_know;
3648           continue;
3649         }
3650
3651       /* When there is a subscript with no dependence we can stop.  */
3652       else if (CF_NO_DEPENDENCE_P (overlaps_a)
3653                || CF_NO_DEPENDENCE_P (overlaps_b))
3654         {
3655           res = chrec_known;
3656           break;
3657         }
3658     }
3659
3660   if (res == NULL_TREE)
3661     return true;
3662
3663   if (res == chrec_known)
3664     dependence_stats.num_dependence_independent++;
3665   else
3666     dependence_stats.num_dependence_undetermined++;
3667   finalize_ddr_dependent (ddr, res);
3668   return false;
3669 }
3670
3671 /* Computes the conflicting iterations in LOOP_NEST, and initialize DDR.  */
3672
3673 static void
3674 subscript_dependence_tester (struct data_dependence_relation *ddr,
3675                              struct loop *loop_nest)
3676 {
3677   if (subscript_dependence_tester_1 (ddr, DDR_A (ddr), DDR_B (ddr), loop_nest))
3678     dependence_stats.num_dependence_dependent++;
3679
3680   compute_subscript_distance (ddr);
3681   if (build_classic_dist_vector (ddr, loop_nest))
3682     build_classic_dir_vector (ddr);
3683 }
3684
3685 /* Returns true when all the access functions of A are affine or
3686    constant with respect to LOOP_NEST.  */
3687
3688 static bool
3689 access_functions_are_affine_or_constant_p (const struct data_reference *a,
3690                                            const struct loop *loop_nest)
3691 {
3692   unsigned int i;
3693   vec<tree> fns = DR_ACCESS_FNS (a);
3694   tree t;
3695
3696   FOR_EACH_VEC_ELT (fns, i, t)
3697     if (!evolution_function_is_invariant_p (t, loop_nest->num)
3698         && !evolution_function_is_affine_multivariate_p (t, loop_nest->num))
3699       return false;
3700
3701   return true;
3702 }
3703
3704 /* Initializes an equation for an OMEGA problem using the information
3705    contained in the ACCESS_FUN.  Returns true when the operation
3706    succeeded.
3707
3708    PB is the omega constraint system.
3709    EQ is the number of the equation to be initialized.
3710    OFFSET is used for shifting the variables names in the constraints:
3711    a constrain is composed of 2 * the number of variables surrounding
3712    dependence accesses.  OFFSET is set either to 0 for the first n variables,
3713    then it is set to n.
3714    ACCESS_FUN is expected to be an affine chrec.  */
3715
3716 static bool
3717 init_omega_eq_with_af (omega_pb pb, unsigned eq,
3718                        unsigned int offset, tree access_fun,
3719                        struct data_dependence_relation *ddr)
3720 {
3721   switch (TREE_CODE (access_fun))
3722     {
3723     case POLYNOMIAL_CHREC:
3724       {
3725         tree left = CHREC_LEFT (access_fun);
3726         tree right = CHREC_RIGHT (access_fun);
3727         int var = CHREC_VARIABLE (access_fun);
3728         unsigned var_idx;
3729
3730         if (TREE_CODE (right) != INTEGER_CST)
3731           return false;
3732
3733         var_idx = index_in_loop_nest (var, DDR_LOOP_NEST (ddr));
3734         pb->eqs[eq].coef[offset + var_idx + 1] = int_cst_value (right);
3735
3736         /* Compute the innermost loop index.  */
3737         DDR_INNER_LOOP (ddr) = MAX (DDR_INNER_LOOP (ddr), var_idx);
3738
3739         if (offset == 0)
3740           pb->eqs[eq].coef[var_idx + DDR_NB_LOOPS (ddr) + 1]
3741             += int_cst_value (right);
3742
3743         switch (TREE_CODE (left))
3744           {
3745           case POLYNOMIAL_CHREC:
3746             return init_omega_eq_with_af (pb, eq, offset, left, ddr);
3747
3748           case INTEGER_CST:
3749             pb->eqs[eq].coef[0] += int_cst_value (left);
3750             return true;
3751
3752           default:
3753             return false;
3754           }
3755       }
3756
3757     case INTEGER_CST:
3758       pb->eqs[eq].coef[0] += int_cst_value (access_fun);
3759       return true;
3760
3761     default:
3762       return false;
3763     }
3764 }
3765
3766 /* As explained in the comments preceding init_omega_for_ddr, we have
3767    to set up a system for each loop level, setting outer loops
3768    variation to zero, and current loop variation to positive or zero.
3769    Save each lexico positive distance vector.  */
3770
3771 static void
3772 omega_extract_distance_vectors (omega_pb pb,
3773                                 struct data_dependence_relation *ddr)
3774 {
3775   int eq, geq;
3776   unsigned i, j;
3777   struct loop *loopi, *loopj;
3778   enum omega_result res;
3779
3780   /* Set a new problem for each loop in the nest.  The basis is the
3781      problem that we have initialized until now.  On top of this we
3782      add new constraints.  */
3783   for (i = 0; i <= DDR_INNER_LOOP (ddr)
3784               && DDR_LOOP_NEST (ddr).iterate (i, &loopi); i++)
3785     {
3786       int dist = 0;
3787       omega_pb copy = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr),
3788                                            DDR_NB_LOOPS (ddr));
3789
3790       omega_copy_problem (copy, pb);
3791
3792       /* For all the outer loops "loop_j", add "dj = 0".  */
3793       for (j = 0; j < i && DDR_LOOP_NEST (ddr).iterate (j, &loopj); j++)
3794         {
3795           eq = omega_add_zero_eq (copy, omega_black);
3796           copy->eqs[eq].coef[j + 1] = 1;
3797         }
3798
3799       /* For "loop_i", add "0 <= di".  */
3800       geq = omega_add_zero_geq (copy, omega_black);
3801       copy->geqs[geq].coef[i + 1] = 1;
3802
3803       /* Reduce the constraint system, and test that the current
3804          problem is feasible.  */
3805       res = omega_simplify_problem (copy);
3806       if (res == omega_false
3807           || res == omega_unknown
3808           || copy->num_geqs > (int) DDR_NB_LOOPS (ddr))
3809         goto next_problem;
3810
3811       for (eq = 0; eq < copy->num_subs; eq++)
3812         if (copy->subs[eq].key == (int) i + 1)
3813           {
3814             dist = copy->subs[eq].coef[0];
3815             goto found_dist;
3816           }
3817
3818       if (dist == 0)
3819         {
3820           /* Reinitialize problem...  */
3821           omega_copy_problem (copy, pb);
3822           for (j = 0; j < i && DDR_LOOP_NEST (ddr).iterate (j, &loopj); j++)
3823             {
3824               eq = omega_add_zero_eq (copy, omega_black);
3825               copy->eqs[eq].coef[j + 1] = 1;
3826             }
3827
3828           /* ..., but this time "di = 1".  */
3829           eq = omega_add_zero_eq (copy, omega_black);
3830           copy->eqs[eq].coef[i + 1] = 1;
3831           copy->eqs[eq].coef[0] = -1;
3832
3833           res = omega_simplify_problem (copy);
3834           if (res == omega_false
3835               || res == omega_unknown
3836               || copy->num_geqs > (int) DDR_NB_LOOPS (ddr))
3837             goto next_problem;
3838
3839           for (eq = 0; eq < copy->num_subs; eq++)
3840             if (copy->subs[eq].key == (int) i + 1)
3841               {
3842                 dist = copy->subs[eq].coef[0];
3843                 goto found_dist;
3844               }
3845         }
3846
3847     found_dist:;
3848       /* Save the lexicographically positive distance vector.  */
3849       if (dist >= 0)
3850         {
3851           lambda_vector dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3852           lambda_vector dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3853
3854           dist_v[i] = dist;
3855
3856           for (eq = 0; eq < copy->num_subs; eq++)
3857             if (copy->subs[eq].key > 0)
3858               {
3859                 dist = copy->subs[eq].coef[0];
3860                 dist_v[copy->subs[eq].key - 1] = dist;
3861               }
3862
3863           for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
3864             dir_v[j] = dir_from_dist (dist_v[j]);
3865
3866           save_dist_v (ddr, dist_v);
3867           save_dir_v (ddr, dir_v);
3868         }
3869
3870     next_problem:;
3871       omega_free_problem (copy);
3872     }
3873 }
3874
3875 /* This is called for each subscript of a tuple of data references:
3876    insert an equality for representing the conflicts.  */
3877
3878 static bool
3879 omega_setup_subscript (tree access_fun_a, tree access_fun_b,
3880                        struct data_dependence_relation *ddr,
3881                        omega_pb pb, bool *maybe_dependent)
3882 {
3883   int eq;
3884   tree type = signed_type_for_types (TREE_TYPE (access_fun_a),
3885                                      TREE_TYPE (access_fun_b));
3886   tree fun_a = chrec_convert (type, access_fun_a, NULL);
3887   tree fun_b = chrec_convert (type, access_fun_b, NULL);
3888   tree difference = chrec_fold_minus (type, fun_a, fun_b);
3889   tree minus_one;
3890
3891   /* When the fun_a - fun_b is not constant, the dependence is not
3892      captured by the classic distance vector representation.  */
3893   if (TREE_CODE (difference) != INTEGER_CST)
3894     return false;
3895
3896   /* ZIV test.  */
3897   if (ziv_subscript_p (fun_a, fun_b) && !integer_zerop (difference))
3898     {
3899       /* There is no dependence.  */
3900       *maybe_dependent = false;
3901       return true;
3902     }
3903
3904   minus_one = build_int_cst (type, -1);
3905   fun_b = chrec_fold_multiply (type, fun_b, minus_one);
3906
3907   eq = omega_add_zero_eq (pb, omega_black);
3908   if (!init_omega_eq_with_af (pb, eq, DDR_NB_LOOPS (ddr), fun_a, ddr)
3909       || !init_omega_eq_with_af (pb, eq, 0, fun_b, ddr))
3910     /* There is probably a dependence, but the system of
3911        constraints cannot be built: answer "don't know".  */
3912     return false;
3913
3914   /* GCD test.  */
3915   if (DDR_NB_LOOPS (ddr) != 0 && pb->eqs[eq].coef[0]
3916       && !int_divides_p (lambda_vector_gcd
3917                          ((lambda_vector) &(pb->eqs[eq].coef[1]),
3918                           2 * DDR_NB_LOOPS (ddr)),
3919                          pb->eqs[eq].coef[0]))
3920     {
3921       /* There is no dependence.  */
3922       *maybe_dependent = false;
3923       return true;
3924     }
3925
3926   return true;
3927 }
3928
3929 /* Helper function, same as init_omega_for_ddr but specialized for
3930    data references A and B.  */
3931
3932 static bool
3933 init_omega_for_ddr_1 (struct data_reference *dra, struct data_reference *drb,
3934                       struct data_dependence_relation *ddr,
3935                       omega_pb pb, bool *maybe_dependent)
3936 {
3937   unsigned i;
3938   int ineq;
3939   struct loop *loopi;
3940   unsigned nb_loops = DDR_NB_LOOPS (ddr);
3941
3942   /* Insert an equality per subscript.  */
3943   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3944     {
3945       if (!omega_setup_subscript (DR_ACCESS_FN (dra, i), DR_ACCESS_FN (drb, i),
3946                                   ddr, pb, maybe_dependent))
3947         return false;
3948       else if (*maybe_dependent == false)
3949         {
3950           /* There is no dependence.  */
3951           DDR_ARE_DEPENDENT (ddr) = chrec_known;
3952           return true;
3953         }
3954     }
3955
3956   /* Insert inequalities: constraints corresponding to the iteration
3957      domain, i.e. the loops surrounding the references "loop_x" and
3958      the distance variables "dx".  The layout of the OMEGA
3959      representation is as follows:
3960      - coef[0] is the constant
3961      - coef[1..nb_loops] are the protected variables that will not be
3962      removed by the solver: the "dx"
3963      - coef[nb_loops + 1, 2*nb_loops] are the loop variables: "loop_x".
3964   */
3965   for (i = 0; i <= DDR_INNER_LOOP (ddr)
3966               && DDR_LOOP_NEST (ddr).iterate (i, &loopi); i++)
3967     {
3968       HOST_WIDE_INT nbi = max_stmt_executions_int (loopi);
3969
3970       /* 0 <= loop_x */
3971       ineq = omega_add_zero_geq (pb, omega_black);
3972       pb->geqs[ineq].coef[i + nb_loops + 1] = 1;
3973
3974       /* 0 <= loop_x + dx */
3975       ineq = omega_add_zero_geq (pb, omega_black);
3976       pb->geqs[ineq].coef[i + nb_loops + 1] = 1;
3977       pb->geqs[ineq].coef[i + 1] = 1;
3978
3979       if (nbi != -1)
3980         {
3981           /* loop_x <= nb_iters */
3982           ineq = omega_add_zero_geq (pb, omega_black);
3983           pb->geqs[ineq].coef[i + nb_loops + 1] = -1;
3984           pb->geqs[ineq].coef[0] = nbi;
3985
3986           /* loop_x + dx <= nb_iters */
3987           ineq = omega_add_zero_geq (pb, omega_black);
3988           pb->geqs[ineq].coef[i + nb_loops + 1] = -1;
3989           pb->geqs[ineq].coef[i + 1] = -1;
3990           pb->geqs[ineq].coef[0] = nbi;
3991
3992           /* A step "dx" bigger than nb_iters is not feasible, so
3993              add "0 <= nb_iters + dx",  */
3994           ineq = omega_add_zero_geq (pb, omega_black);
3995           pb->geqs[ineq].coef[i + 1] = 1;
3996           pb->geqs[ineq].coef[0] = nbi;
3997           /* and "dx <= nb_iters".  */
3998           ineq = omega_add_zero_geq (pb, omega_black);
3999           pb->geqs[ineq].coef[i + 1] = -1;
4000           pb->geqs[ineq].coef[0] = nbi;
4001         }
4002     }
4003
4004   omega_extract_distance_vectors (pb, ddr);
4005
4006   return true;
4007 }
4008
4009 /* Sets up the Omega dependence problem for the data dependence
4010    relation DDR.  Returns false when the constraint system cannot be
4011    built, ie. when the test answers "don't know".  Returns true
4012    otherwise, and when independence has been proved (using one of the
4013    trivial dependence test), set MAYBE_DEPENDENT to false, otherwise
4014    set MAYBE_DEPENDENT to true.
4015
4016    Example: for setting up the dependence system corresponding to the
4017    conflicting accesses
4018
4019    | loop_i
4020    |   loop_j
4021    |     A[i, i+1] = ...
4022    |     ... A[2*j, 2*(i + j)]
4023    |   endloop_j
4024    | endloop_i
4025
4026    the following constraints come from the iteration domain:
4027
4028    0 <= i <= Ni
4029    0 <= i + di <= Ni
4030    0 <= j <= Nj
4031    0 <= j + dj <= Nj
4032
4033    where di, dj are the distance variables.  The constraints
4034    representing the conflicting elements are:
4035
4036    i = 2 * (j + dj)
4037    i + 1 = 2 * (i + di + j + dj)
4038
4039    For asking that the resulting distance vector (di, dj) be
4040    lexicographically positive, we insert the constraint "di >= 0".  If
4041    "di = 0" in the solution, we fix that component to zero, and we
4042    look at the inner loops: we set a new problem where all the outer
4043    loop distances are zero, and fix this inner component to be
4044    positive.  When one of the components is positive, we save that
4045    distance, and set a new problem where the distance on this loop is
4046    zero, searching for other distances in the inner loops.  Here is
4047    the classic example that illustrates that we have to set for each
4048    inner loop a new problem:
4049
4050    | loop_1
4051    |   loop_2
4052    |     A[10]
4053    |   endloop_2
4054    | endloop_1
4055
4056    we have to save two distances (1, 0) and (0, 1).
4057
4058    Given two array references, refA and refB, we have to set the
4059    dependence problem twice, refA vs. refB and refB vs. refA, and we
4060    cannot do a single test, as refB might occur before refA in the
4061    inner loops, and the contrary when considering outer loops: ex.
4062
4063    | loop_0
4064    |   loop_1
4065    |     loop_2
4066    |       T[{1,+,1}_2][{1,+,1}_1]  // refA
4067    |       T[{2,+,1}_2][{0,+,1}_1]  // refB
4068    |     endloop_2
4069    |   endloop_1
4070    | endloop_0
4071
4072    refB touches the elements in T before refA, and thus for the same
4073    loop_0 refB precedes refA: ie. the distance vector (0, 1, -1)
4074    but for successive loop_0 iterations, we have (1, -1, 1)
4075
4076    The Omega solver expects the distance variables ("di" in the
4077    previous example) to come first in the constraint system (as
4078    variables to be protected, or "safe" variables), the constraint
4079    system is built using the following layout:
4080
4081    "cst | distance vars | index vars".
4082 */
4083
4084 static bool
4085 init_omega_for_ddr (struct data_dependence_relation *ddr,
4086                     bool *maybe_dependent)
4087 {
4088   omega_pb pb;
4089   bool res = false;
4090
4091   *maybe_dependent = true;
4092
4093   if (same_access_functions (ddr))
4094     {
4095       unsigned j;
4096       lambda_vector dir_v;
4097
4098       /* Save the 0 vector.  */
4099       save_dist_v (ddr, lambda_vector_new (DDR_NB_LOOPS (ddr)));
4100       dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
4101       for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
4102         dir_v[j] = dir_equal;
4103       save_dir_v (ddr, dir_v);
4104
4105       /* Save the dependences carried by outer loops.  */
4106       pb = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr), DDR_NB_LOOPS (ddr));
4107       res = init_omega_for_ddr_1 (DDR_A (ddr), DDR_B (ddr), ddr, pb,
4108                                   maybe_dependent);
4109       omega_free_problem (pb);
4110       return res;
4111     }
4112
4113   /* Omega expects the protected variables (those that have to be kept
4114      after elimination) to appear first in the constraint system.
4115      These variables are the distance variables.  In the following
4116      initialization we declare NB_LOOPS safe variables, and the total
4117      number of variables for the constraint system is 2*NB_LOOPS.  */
4118   pb = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr), DDR_NB_LOOPS (ddr));
4119   res = init_omega_for_ddr_1 (DDR_A (ddr), DDR_B (ddr), ddr, pb,
4120                               maybe_dependent);
4121   omega_free_problem (pb);
4122
4123   /* Stop computation if not decidable, or no dependence.  */
4124   if (res == false || *maybe_dependent == false)
4125     return res;
4126
4127   pb = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr), DDR_NB_LOOPS (ddr));
4128   res = init_omega_for_ddr_1 (DDR_B (ddr), DDR_A (ddr), ddr, pb,
4129                               maybe_dependent);
4130   omega_free_problem (pb);
4131
4132   return res;
4133 }
4134
4135 /* Return true when DDR contains the same information as that stored
4136    in DIR_VECTS and in DIST_VECTS, return false otherwise.   */
4137
4138 static bool
4139 ddr_consistent_p (FILE *file,
4140                   struct data_dependence_relation *ddr,
4141                   vec<lambda_vector> dist_vects,
4142                   vec<lambda_vector> dir_vects)
4143 {
4144   unsigned int i, j;
4145
4146   /* If dump_file is set, output there.  */
4147   if (dump_file && (dump_flags & TDF_DETAILS))
4148     file = dump_file;
4149
4150   if (dist_vects.length () != DDR_NUM_DIST_VECTS (ddr))
4151     {
4152       lambda_vector b_dist_v;
4153       fprintf (file, "\n(Number of distance vectors differ: Banerjee has %d, Omega has %d.\n",
4154                dist_vects.length (),
4155                DDR_NUM_DIST_VECTS (ddr));
4156
4157       fprintf (file, "Banerjee dist vectors:\n");
4158       FOR_EACH_VEC_ELT (dist_vects, i, b_dist_v)
4159         print_lambda_vector (file, b_dist_v, DDR_NB_LOOPS (ddr));
4160
4161       fprintf (file, "Omega dist vectors:\n");
4162       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
4163         print_lambda_vector (file, DDR_DIST_VECT (ddr, i), DDR_NB_LOOPS (ddr));
4164
4165       fprintf (file, "data dependence relation:\n");
4166       dump_data_dependence_relation (file, ddr);
4167
4168       fprintf (file, ")\n");
4169       return false;
4170     }
4171
4172   if (dir_vects.length () != DDR_NUM_DIR_VECTS (ddr))
4173     {
4174       fprintf (file, "\n(Number of direction vectors differ: Banerjee has %d, Omega has %d.)\n",
4175                dir_vects.length (),
4176                DDR_NUM_DIR_VECTS (ddr));
4177       return false;
4178     }
4179
4180   for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
4181     {
4182       lambda_vector a_dist_v;
4183       lambda_vector b_dist_v = DDR_DIST_VECT (ddr, i);
4184
4185       /* Distance vectors are not ordered in the same way in the DDR
4186          and in the DIST_VECTS: search for a matching vector.  */
4187       FOR_EACH_VEC_ELT (dist_vects, j, a_dist_v)
4188         if (lambda_vector_equal (a_dist_v, b_dist_v, DDR_NB_LOOPS (ddr)))
4189           break;
4190
4191       if (j == dist_vects.length ())
4192         {
4193           fprintf (file, "\n(Dist vectors from the first dependence analyzer:\n");
4194           print_dist_vectors (file, dist_vects, DDR_NB_LOOPS (ddr));
4195           fprintf (file, "not found in Omega dist vectors:\n");
4196           print_dist_vectors (file, DDR_DIST_VECTS (ddr), DDR_NB_LOOPS (ddr));
4197           fprintf (file, "data dependence relation:\n");
4198           dump_data_dependence_relation (file, ddr);
4199           fprintf (file, ")\n");
4200         }
4201     }
4202
4203   for (i = 0; i < DDR_NUM_DIR_VECTS (ddr); i++)
4204     {
4205       lambda_vector a_dir_v;
4206       lambda_vector b_dir_v = DDR_DIR_VECT (ddr, i);
4207
4208       /* Direction vectors are not ordered in the same way in the DDR
4209          and in the DIR_VECTS: search for a matching vector.  */
4210       FOR_EACH_VEC_ELT (dir_vects, j, a_dir_v)
4211         if (lambda_vector_equal (a_dir_v, b_dir_v, DDR_NB_LOOPS (ddr)))
4212           break;
4213
4214       if (j == dist_vects.length ())
4215         {
4216           fprintf (file, "\n(Dir vectors from the first dependence analyzer:\n");
4217           print_dir_vectors (file, dir_vects, DDR_NB_LOOPS (ddr));
4218           fprintf (file, "not found in Omega dir vectors:\n");
4219           print_dir_vectors (file, DDR_DIR_VECTS (ddr), DDR_NB_LOOPS (ddr));
4220           fprintf (file, "data dependence relation:\n");
4221           dump_data_dependence_relation (file, ddr);
4222           fprintf (file, ")\n");
4223         }
4224     }
4225
4226   return true;
4227 }
4228
4229 /* This computes the affine dependence relation between A and B with
4230    respect to LOOP_NEST.  CHREC_KNOWN is used for representing the
4231    independence between two accesses, while CHREC_DONT_KNOW is used
4232    for representing the unknown relation.
4233
4234    Note that it is possible to stop the computation of the dependence
4235    relation the first time we detect a CHREC_KNOWN element for a given
4236    subscript.  */
4237
4238 void
4239 compute_affine_dependence (struct data_dependence_relation *ddr,
4240                            struct loop *loop_nest)
4241 {
4242   struct data_reference *dra = DDR_A (ddr);
4243   struct data_reference *drb = DDR_B (ddr);
4244
4245   if (dump_file && (dump_flags & TDF_DETAILS))
4246     {
4247       fprintf (dump_file, "(compute_affine_dependence\n");
4248       fprintf (dump_file, "  stmt_a: ");
4249       print_gimple_stmt (dump_file, DR_STMT (dra), 0, TDF_SLIM);
4250       fprintf (dump_file, "  stmt_b: ");
4251       print_gimple_stmt (dump_file, DR_STMT (drb), 0, TDF_SLIM);
4252     }
4253
4254   /* Analyze only when the dependence relation is not yet known.  */
4255   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
4256     {
4257       dependence_stats.num_dependence_tests++;
4258
4259       if (access_functions_are_affine_or_constant_p (dra, loop_nest)
4260           && access_functions_are_affine_or_constant_p (drb, loop_nest))
4261         {
4262           subscript_dependence_tester (ddr, loop_nest);
4263
4264           if (flag_check_data_deps)
4265             {
4266               /* Dump the dependences from the first algorithm.  */
4267               if (dump_file && (dump_flags & TDF_DETAILS))
4268                 {
4269                   fprintf (dump_file, "\n\nBanerjee Analyzer\n");
4270                   dump_data_dependence_relation (dump_file, ddr);
4271                 }
4272
4273               if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
4274                 {
4275                   bool maybe_dependent;
4276                   vec<lambda_vector> dir_vects, dist_vects;
4277
4278                   /* Save the result of the first DD analyzer.  */
4279                   dist_vects = DDR_DIST_VECTS (ddr);
4280                   dir_vects = DDR_DIR_VECTS (ddr);
4281
4282                   /* Reset the information.  */
4283                   DDR_DIST_VECTS (ddr).create (0);
4284                   DDR_DIR_VECTS (ddr).create (0);
4285
4286                   /* Compute the same information using Omega.  */
4287                   if (!init_omega_for_ddr (ddr, &maybe_dependent))
4288                     goto csys_dont_know;
4289
4290                   if (dump_file && (dump_flags & TDF_DETAILS))
4291                     {
4292                       fprintf (dump_file, "Omega Analyzer\n");
4293                       dump_data_dependence_relation (dump_file, ddr);
4294                     }
4295
4296                   /* Check that we get the same information.  */
4297                   if (maybe_dependent)
4298                     gcc_assert (ddr_consistent_p (stderr, ddr, dist_vects,
4299                                                   dir_vects));
4300                 }
4301             }
4302         }
4303
4304       /* As a last case, if the dependence cannot be determined, or if
4305          the dependence is considered too difficult to determine, answer
4306          "don't know".  */
4307       else
4308         {
4309         csys_dont_know:;
4310           dependence_stats.num_dependence_undetermined++;
4311
4312           if (dump_file && (dump_flags & TDF_DETAILS))
4313             {
4314               fprintf (dump_file, "Data ref a:\n");
4315               dump_data_reference (dump_file, dra);
4316               fprintf (dump_file, "Data ref b:\n");
4317               dump_data_reference (dump_file, drb);
4318               fprintf (dump_file, "affine dependence test not usable: access function not affine or constant.\n");
4319             }
4320           finalize_ddr_dependent (ddr, chrec_dont_know);
4321         }
4322     }
4323
4324   if (dump_file && (dump_flags & TDF_DETAILS))
4325     {
4326       if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
4327         fprintf (dump_file, ") -> no dependence\n");
4328       else if (DDR_ARE_DEPENDENT (ddr) == chrec_dont_know)
4329         fprintf (dump_file, ") -> dependence analysis failed\n");
4330       else
4331         fprintf (dump_file, ")\n");
4332     }
4333 }
4334
4335 /* Compute in DEPENDENCE_RELATIONS the data dependence graph for all
4336    the data references in DATAREFS, in the LOOP_NEST.  When
4337    COMPUTE_SELF_AND_RR is FALSE, don't compute read-read and self
4338    relations.  Return true when successful, i.e. data references number
4339    is small enough to be handled.  */
4340
4341 bool
4342 compute_all_dependences (vec<data_reference_p> datarefs,
4343                          vec<ddr_p> *dependence_relations,
4344                          vec<loop_p> loop_nest,
4345                          bool compute_self_and_rr)
4346 {
4347   struct data_dependence_relation *ddr;
4348   struct data_reference *a, *b;
4349   unsigned int i, j;
4350
4351   if ((int) datarefs.length ()
4352       > PARAM_VALUE (PARAM_LOOP_MAX_DATAREFS_FOR_DATADEPS))
4353     {
4354       struct data_dependence_relation *ddr;
4355
4356       /* Insert a single relation into dependence_relations:
4357          chrec_dont_know.  */
4358       ddr = initialize_data_dependence_relation (NULL, NULL, loop_nest);
4359       dependence_relations->safe_push (ddr);
4360       return false;
4361     }
4362
4363   FOR_EACH_VEC_ELT (datarefs, i, a)
4364     for (j = i + 1; datarefs.iterate (j, &b); j++)
4365       if (DR_IS_WRITE (a) || DR_IS_WRITE (b) || compute_self_and_rr)
4366         {
4367           ddr = initialize_data_dependence_relation (a, b, loop_nest);
4368           dependence_relations->safe_push (ddr);
4369           if (loop_nest.exists ())
4370             compute_affine_dependence (ddr, loop_nest[0]);
4371         }
4372
4373   if (compute_self_and_rr)
4374     FOR_EACH_VEC_ELT (datarefs, i, a)
4375       {
4376         ddr = initialize_data_dependence_relation (a, a, loop_nest);
4377         dependence_relations->safe_push (ddr);
4378         if (loop_nest.exists ())
4379           compute_affine_dependence (ddr, loop_nest[0]);
4380       }
4381
4382   return true;
4383 }
4384
4385 /* Describes a location of a memory reference.  */
4386
4387 typedef struct data_ref_loc_d
4388 {
4389   /* The memory reference.  */
4390   tree ref;
4391
4392   /* True if the memory reference is read.  */
4393   bool is_read;
4394 } data_ref_loc;
4395
4396
4397 /* Stores the locations of memory references in STMT to REFERENCES.  Returns
4398    true if STMT clobbers memory, false otherwise.  */
4399
4400 static bool
4401 get_references_in_stmt (gimple stmt, vec<data_ref_loc, va_heap> *references)
4402 {
4403   bool clobbers_memory = false;
4404   data_ref_loc ref;
4405   tree op0, op1;
4406   enum gimple_code stmt_code = gimple_code (stmt);
4407
4408   /* ASM_EXPR and CALL_EXPR may embed arbitrary side effects.
4409      As we cannot model data-references to not spelled out
4410      accesses give up if they may occur.  */
4411   if (stmt_code == GIMPLE_CALL
4412       && !(gimple_call_flags (stmt) & ECF_CONST))
4413     {
4414       /* Allow IFN_GOMP_SIMD_LANE in their own loops.  */
4415       if (gimple_call_internal_p (stmt))
4416         switch (gimple_call_internal_fn (stmt))
4417           {
4418           case IFN_GOMP_SIMD_LANE:
4419             {
4420               struct loop *loop = gimple_bb (stmt)->loop_father;
4421               tree uid = gimple_call_arg (stmt, 0);
4422               gcc_assert (TREE_CODE (uid) == SSA_NAME);
4423               if (loop == NULL
4424                   || loop->simduid != SSA_NAME_VAR (uid))
4425                 clobbers_memory = true;
4426               break;
4427             }
4428           case IFN_MASK_LOAD:
4429           case IFN_MASK_STORE:
4430             break;
4431           default:
4432             clobbers_memory = true;
4433             break;
4434           }
4435       else
4436         clobbers_memory = true;
4437     }
4438   else if (stmt_code == GIMPLE_ASM
4439            && (gimple_asm_volatile_p (as_a <gasm *> (stmt))
4440                || gimple_vuse (stmt)))
4441     clobbers_memory = true;
4442
4443   if (!gimple_vuse (stmt))
4444     return clobbers_memory;
4445
4446   if (stmt_code == GIMPLE_ASSIGN)
4447     {
4448       tree base;
4449       op0 = gimple_assign_lhs (stmt);
4450       op1 = gimple_assign_rhs1 (stmt);
4451
4452       if (DECL_P (op1)
4453           || (REFERENCE_CLASS_P (op1)
4454               && (base = get_base_address (op1))
4455               && TREE_CODE (base) != SSA_NAME))
4456         {
4457           ref.ref = op1;
4458           ref.is_read = true;
4459           references->safe_push (ref);
4460         }
4461     }
4462   else if (stmt_code == GIMPLE_CALL)
4463     {
4464       unsigned i, n;
4465
4466       ref.is_read = false;
4467       if (gimple_call_internal_p (stmt))
4468         switch (gimple_call_internal_fn (stmt))
4469           {
4470           case IFN_MASK_LOAD:
4471             if (gimple_call_lhs (stmt) == NULL_TREE)
4472               break;
4473             ref.is_read = true;
4474           case IFN_MASK_STORE:
4475             ref.ref = fold_build2 (MEM_REF,
4476                                    ref.is_read
4477                                    ? TREE_TYPE (gimple_call_lhs (stmt))
4478                                    : TREE_TYPE (gimple_call_arg (stmt, 3)),
4479                                    gimple_call_arg (stmt, 0),
4480                                    gimple_call_arg (stmt, 1));
4481             references->safe_push (ref);
4482             return false;
4483           default:
4484             break;
4485           }
4486
4487       op0 = gimple_call_lhs (stmt);
4488       n = gimple_call_num_args (stmt);
4489       for (i = 0; i < n; i++)
4490         {
4491           op1 = gimple_call_arg (stmt, i);
4492
4493           if (DECL_P (op1)
4494               || (REFERENCE_CLASS_P (op1) && get_base_address (op1)))
4495             {
4496               ref.ref = op1;
4497               ref.is_read = true;
4498               references->safe_push (ref);
4499             }
4500         }
4501     }
4502   else
4503     return clobbers_memory;
4504
4505   if (op0
4506       && (DECL_P (op0)
4507           || (REFERENCE_CLASS_P (op0) && get_base_address (op0))))
4508     {
4509       ref.ref = op0;
4510       ref.is_read = false;
4511       references->safe_push (ref);
4512     }
4513   return clobbers_memory;
4514 }
4515
4516 /* Stores the data references in STMT to DATAREFS.  If there is an unanalyzable
4517    reference, returns false, otherwise returns true.  NEST is the outermost
4518    loop of the loop nest in which the references should be analyzed.  */
4519
4520 bool
4521 find_data_references_in_stmt (struct loop *nest, gimple stmt,
4522                               vec<data_reference_p> *datarefs)
4523 {
4524   unsigned i;
4525   auto_vec<data_ref_loc, 2> references;
4526   data_ref_loc *ref;
4527   bool ret = true;
4528   data_reference_p dr;
4529
4530   if (get_references_in_stmt (stmt, &references))
4531     return false;
4532
4533   FOR_EACH_VEC_ELT (references, i, ref)
4534     {
4535       dr = create_data_ref (nest, loop_containing_stmt (stmt),
4536                             ref->ref, stmt, ref->is_read);
4537       gcc_assert (dr != NULL);
4538       datarefs->safe_push (dr);
4539     }
4540   references.release ();
4541   return ret;
4542 }
4543
4544 /* Stores the data references in STMT to DATAREFS.  If there is an
4545    unanalyzable reference, returns false, otherwise returns true.
4546    NEST is the outermost loop of the loop nest in which the references
4547    should be instantiated, LOOP is the loop in which the references
4548    should be analyzed.  */
4549
4550 bool
4551 graphite_find_data_references_in_stmt (loop_p nest, loop_p loop, gimple stmt,
4552                                        vec<data_reference_p> *datarefs)
4553 {
4554   unsigned i;
4555   auto_vec<data_ref_loc, 2> references;
4556   data_ref_loc *ref;
4557   bool ret = true;
4558   data_reference_p dr;
4559
4560   if (get_references_in_stmt (stmt, &references))
4561     return false;
4562
4563   FOR_EACH_VEC_ELT (references, i, ref)
4564     {
4565       dr = create_data_ref (nest, loop, ref->ref, stmt, ref->is_read);
4566       gcc_assert (dr != NULL);
4567       datarefs->safe_push (dr);
4568     }
4569
4570   references.release ();
4571   return ret;
4572 }
4573
4574 /* Search the data references in LOOP, and record the information into
4575    DATAREFS.  Returns chrec_dont_know when failing to analyze a
4576    difficult case, returns NULL_TREE otherwise.  */
4577
4578 tree
4579 find_data_references_in_bb (struct loop *loop, basic_block bb,
4580                             vec<data_reference_p> *datarefs)
4581 {
4582   gimple_stmt_iterator bsi;
4583
4584   for (bsi = gsi_start_bb (bb); !gsi_end_p (bsi); gsi_next (&bsi))
4585     {
4586       gimple stmt = gsi_stmt (bsi);
4587
4588       if (!find_data_references_in_stmt (loop, stmt, datarefs))
4589         {
4590           struct data_reference *res;
4591           res = XCNEW (struct data_reference);
4592           datarefs->safe_push (res);
4593
4594           return chrec_dont_know;
4595         }
4596     }
4597
4598   return NULL_TREE;
4599 }
4600
4601 /* Search the data references in LOOP, and record the information into
4602    DATAREFS.  Returns chrec_dont_know when failing to analyze a
4603    difficult case, returns NULL_TREE otherwise.
4604
4605    TODO: This function should be made smarter so that it can handle address
4606    arithmetic as if they were array accesses, etc.  */
4607
4608 tree
4609 find_data_references_in_loop (struct loop *loop,
4610                               vec<data_reference_p> *datarefs)
4611 {
4612   basic_block bb, *bbs;
4613   unsigned int i;
4614
4615   bbs = get_loop_body_in_dom_order (loop);
4616
4617   for (i = 0; i < loop->num_nodes; i++)
4618     {
4619       bb = bbs[i];
4620
4621       if (find_data_references_in_bb (loop, bb, datarefs) == chrec_dont_know)
4622         {
4623           free (bbs);
4624           return chrec_dont_know;
4625         }
4626     }
4627   free (bbs);
4628
4629   return NULL_TREE;
4630 }
4631
4632 /* Recursive helper function.  */
4633
4634 static bool
4635 find_loop_nest_1 (struct loop *loop, vec<loop_p> *loop_nest)
4636 {
4637   /* Inner loops of the nest should not contain siblings.  Example:
4638      when there are two consecutive loops,
4639
4640      | loop_0
4641      |   loop_1
4642      |     A[{0, +, 1}_1]
4643      |   endloop_1
4644      |   loop_2
4645      |     A[{0, +, 1}_2]
4646      |   endloop_2
4647      | endloop_0
4648
4649      the dependence relation cannot be captured by the distance
4650      abstraction.  */
4651   if (loop->next)
4652     return false;
4653
4654   loop_nest->safe_push (loop);
4655   if (loop->inner)
4656     return find_loop_nest_1 (loop->inner, loop_nest);
4657   return true;
4658 }
4659
4660 /* Return false when the LOOP is not well nested.  Otherwise return
4661    true and insert in LOOP_NEST the loops of the nest.  LOOP_NEST will
4662    contain the loops from the outermost to the innermost, as they will
4663    appear in the classic distance vector.  */
4664
4665 bool
4666 find_loop_nest (struct loop *loop, vec<loop_p> *loop_nest)
4667 {
4668   loop_nest->safe_push (loop);
4669   if (loop->inner)
4670     return find_loop_nest_1 (loop->inner, loop_nest);
4671   return true;
4672 }
4673
4674 /* Returns true when the data dependences have been computed, false otherwise.
4675    Given a loop nest LOOP, the following vectors are returned:
4676    DATAREFS is initialized to all the array elements contained in this loop,
4677    DEPENDENCE_RELATIONS contains the relations between the data references.
4678    Compute read-read and self relations if
4679    COMPUTE_SELF_AND_READ_READ_DEPENDENCES is TRUE.  */
4680
4681 bool
4682 compute_data_dependences_for_loop (struct loop *loop,
4683                                    bool compute_self_and_read_read_dependences,
4684                                    vec<loop_p> *loop_nest,
4685                                    vec<data_reference_p> *datarefs,
4686                                    vec<ddr_p> *dependence_relations)
4687 {
4688   bool res = true;
4689
4690   memset (&dependence_stats, 0, sizeof (dependence_stats));
4691
4692   /* If the loop nest is not well formed, or one of the data references
4693      is not computable, give up without spending time to compute other
4694      dependences.  */
4695   if (!loop
4696       || !find_loop_nest (loop, loop_nest)
4697       || find_data_references_in_loop (loop, datarefs) == chrec_dont_know
4698       || !compute_all_dependences (*datarefs, dependence_relations, *loop_nest,
4699                                    compute_self_and_read_read_dependences))
4700     res = false;
4701
4702   if (dump_file && (dump_flags & TDF_STATS))
4703     {
4704       fprintf (dump_file, "Dependence tester statistics:\n");
4705
4706       fprintf (dump_file, "Number of dependence tests: %d\n",
4707                dependence_stats.num_dependence_tests);
4708       fprintf (dump_file, "Number of dependence tests classified dependent: %d\n",
4709                dependence_stats.num_dependence_dependent);
4710       fprintf (dump_file, "Number of dependence tests classified independent: %d\n",
4711                dependence_stats.num_dependence_independent);
4712       fprintf (dump_file, "Number of undetermined dependence tests: %d\n",
4713                dependence_stats.num_dependence_undetermined);
4714
4715       fprintf (dump_file, "Number of subscript tests: %d\n",
4716                dependence_stats.num_subscript_tests);
4717       fprintf (dump_file, "Number of undetermined subscript tests: %d\n",
4718                dependence_stats.num_subscript_undetermined);
4719       fprintf (dump_file, "Number of same subscript function: %d\n",
4720                dependence_stats.num_same_subscript_function);
4721
4722       fprintf (dump_file, "Number of ziv tests: %d\n",
4723                dependence_stats.num_ziv);
4724       fprintf (dump_file, "Number of ziv tests returning dependent: %d\n",
4725                dependence_stats.num_ziv_dependent);
4726       fprintf (dump_file, "Number of ziv tests returning independent: %d\n",
4727                dependence_stats.num_ziv_independent);
4728       fprintf (dump_file, "Number of ziv tests unimplemented: %d\n",
4729                dependence_stats.num_ziv_unimplemented);
4730
4731       fprintf (dump_file, "Number of siv tests: %d\n",
4732                dependence_stats.num_siv);
4733       fprintf (dump_file, "Number of siv tests returning dependent: %d\n",
4734                dependence_stats.num_siv_dependent);
4735       fprintf (dump_file, "Number of siv tests returning independent: %d\n",
4736                dependence_stats.num_siv_independent);
4737       fprintf (dump_file, "Number of siv tests unimplemented: %d\n",
4738                dependence_stats.num_siv_unimplemented);
4739
4740       fprintf (dump_file, "Number of miv tests: %d\n",
4741                dependence_stats.num_miv);
4742       fprintf (dump_file, "Number of miv tests returning dependent: %d\n",
4743                dependence_stats.num_miv_dependent);
4744       fprintf (dump_file, "Number of miv tests returning independent: %d\n",
4745                dependence_stats.num_miv_independent);
4746       fprintf (dump_file, "Number of miv tests unimplemented: %d\n",
4747                dependence_stats.num_miv_unimplemented);
4748     }
4749
4750   return res;
4751 }
4752
4753 /* Returns true when the data dependences for the basic block BB have been
4754    computed, false otherwise.
4755    DATAREFS is initialized to all the array elements contained in this basic
4756    block, DEPENDENCE_RELATIONS contains the relations between the data
4757    references. Compute read-read and self relations if
4758    COMPUTE_SELF_AND_READ_READ_DEPENDENCES is TRUE.  */
4759 bool
4760 compute_data_dependences_for_bb (basic_block bb,
4761                                  bool compute_self_and_read_read_dependences,
4762                                  vec<data_reference_p> *datarefs,
4763                                  vec<ddr_p> *dependence_relations)
4764 {
4765   if (find_data_references_in_bb (NULL, bb, datarefs) == chrec_dont_know)
4766     return false;
4767
4768   return compute_all_dependences (*datarefs, dependence_relations, vNULL,
4769                                   compute_self_and_read_read_dependences);
4770 }
4771
4772 /* Entry point (for testing only).  Analyze all the data references
4773    and the dependence relations in LOOP.
4774
4775    The data references are computed first.
4776
4777    A relation on these nodes is represented by a complete graph.  Some
4778    of the relations could be of no interest, thus the relations can be
4779    computed on demand.
4780
4781    In the following function we compute all the relations.  This is
4782    just a first implementation that is here for:
4783    - for showing how to ask for the dependence relations,
4784    - for the debugging the whole dependence graph,
4785    - for the dejagnu testcases and maintenance.
4786
4787    It is possible to ask only for a part of the graph, avoiding to
4788    compute the whole dependence graph.  The computed dependences are
4789    stored in a knowledge base (KB) such that later queries don't
4790    recompute the same information.  The implementation of this KB is
4791    transparent to the optimizer, and thus the KB can be changed with a
4792    more efficient implementation, or the KB could be disabled.  */
4793 static void
4794 analyze_all_data_dependences (struct loop *loop)
4795 {
4796   unsigned int i;
4797   int nb_data_refs = 10;
4798   vec<data_reference_p> datarefs;
4799   datarefs.create (nb_data_refs);
4800   vec<ddr_p> dependence_relations;
4801   dependence_relations.create (nb_data_refs * nb_data_refs);
4802   vec<loop_p> loop_nest;
4803   loop_nest.create (3);
4804
4805   /* Compute DDs on the whole function.  */
4806   compute_data_dependences_for_loop (loop, false, &loop_nest, &datarefs,
4807                                      &dependence_relations);
4808
4809   if (dump_file)
4810     {
4811       dump_data_dependence_relations (dump_file, dependence_relations);
4812       fprintf (dump_file, "\n\n");
4813
4814       if (dump_flags & TDF_DETAILS)
4815         dump_dist_dir_vectors (dump_file, dependence_relations);
4816
4817       if (dump_flags & TDF_STATS)
4818         {
4819           unsigned nb_top_relations = 0;
4820           unsigned nb_bot_relations = 0;
4821           unsigned nb_chrec_relations = 0;
4822           struct data_dependence_relation *ddr;
4823
4824           FOR_EACH_VEC_ELT (dependence_relations, i, ddr)
4825             {
4826               if (chrec_contains_undetermined (DDR_ARE_DEPENDENT (ddr)))
4827                 nb_top_relations++;
4828
4829               else if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
4830                 nb_bot_relations++;
4831
4832               else
4833                 nb_chrec_relations++;
4834             }
4835
4836           gather_stats_on_scev_database ();
4837         }
4838     }
4839
4840   loop_nest.release ();
4841   free_dependence_relations (dependence_relations);
4842   free_data_refs (datarefs);
4843 }
4844
4845 /* Computes all the data dependences and check that the results of
4846    several analyzers are the same.  */
4847
4848 void
4849 tree_check_data_deps (void)
4850 {
4851   struct loop *loop_nest;
4852
4853   FOR_EACH_LOOP (loop_nest, 0)
4854     analyze_all_data_dependences (loop_nest);
4855 }
4856
4857 /* Free the memory used by a data dependence relation DDR.  */
4858
4859 void
4860 free_dependence_relation (struct data_dependence_relation *ddr)
4861 {
4862   if (ddr == NULL)
4863     return;
4864
4865   if (DDR_SUBSCRIPTS (ddr).exists ())
4866     free_subscripts (DDR_SUBSCRIPTS (ddr));
4867   DDR_DIST_VECTS (ddr).release ();
4868   DDR_DIR_VECTS (ddr).release ();
4869
4870   free (ddr);
4871 }
4872
4873 /* Free the memory used by the data dependence relations from
4874    DEPENDENCE_RELATIONS.  */
4875
4876 void
4877 free_dependence_relations (vec<ddr_p> dependence_relations)
4878 {
4879   unsigned int i;
4880   struct data_dependence_relation *ddr;
4881
4882   FOR_EACH_VEC_ELT (dependence_relations, i, ddr)
4883     if (ddr)
4884       free_dependence_relation (ddr);
4885
4886   dependence_relations.release ();
4887 }
4888
4889 /* Free the memory used by the data references from DATAREFS.  */
4890
4891 void
4892 free_data_refs (vec<data_reference_p> datarefs)
4893 {
4894   unsigned int i;
4895   struct data_reference *dr;
4896
4897   FOR_EACH_VEC_ELT (datarefs, i, dr)
4898     free_data_ref (dr);
4899   datarefs.release ();
4900 }