gcc/tree-data-ref.c

   1 /* Data references and dependences detectors.
   2    Copyright (C) 2003, 2004, 2005, 2006, 2007 Free Software Foundation, Inc.
   3    Contributed by Sebastian Pop <pop@cri.ensmp.fr>
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 2, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING.  If not, write to the Free
  19 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
  20 02110-1301, USA.  */
  21
  22 /* This pass walks a given loop structure searching for array
  23    references.  The information about the array accesses is recorded
  24    in DATA_REFERENCE structures.
  25
  26    The basic test for determining the dependences is:
  27    given two access functions chrec1 and chrec2 to a same array, and
  28    x and y two vectors from the iteration domain, the same element of
  29    the array is accessed twice at iterations x and y if and only if:
  30    |             chrec1 (x) == chrec2 (y).
  31
  32    The goals of this analysis are:
  33
  34    - to determine the independence: the relation between two
  35      independent accesses is qualified with the chrec_known (this
  36      information allows a loop parallelization),
  37
  38    - when two data references access the same data, to qualify the
  39      dependence relation with classic dependence representations:
  40
  41        - distance vectors
  42        - direction vectors
  43        - loop carried level dependence
  44        - polyhedron dependence
  45      or with the chains of recurrences based representation,
  46
  47    - to define a knowledge base for storing the data dependence
  48      information,
  49
  50    - to define an interface to access this data.
  51
  52
  53    Definitions:
  54
  55    - subscript: given two array accesses a subscript is the tuple
  56    composed of the access functions for a given dimension.  Example:
  57    Given A[f1][f2][f3] and B[g1][g2][g3], there are three subscripts:
  58    (f1, g1), (f2, g2), (f3, g3).
  59
  60    - Diophantine equation: an equation whose coefficients and
  61    solutions are integer constants, for example the equation
  62    |   3*x + 2*y = 1
  63    has an integer solution x = 1 and y = -1.
  64
  65    References:
  66
  67    - "Advanced Compilation for High Performance Computing" by Randy
  68    Allen and Ken Kennedy.
  69    http://citeseer.ist.psu.edu/goff91practical.html
  70
  71    - "Loop Transformations for Restructuring Compilers - The Foundations"
  72    by Utpal Banerjee.
  73
  74
  75 */
  76
  77 #include "config.h"
  78 #include "system.h"
  79 #include "coretypes.h"
  80 #include "tm.h"
  81 #include "ggc.h"
  82 #include "tree.h"
  83
  84 /* These RTL headers are needed for basic-block.h.  */
  85 #include "rtl.h"
  86 #include "basic-block.h"
  87 #include "diagnostic.h"
  88 #include "tree-flow.h"
  89 #include "tree-dump.h"
  90 #include "timevar.h"
  91 #include "cfgloop.h"
  92 #include "tree-chrec.h"
  93 #include "tree-data-ref.h"
  94 #include "tree-scalar-evolution.h"
  95 #include "tree-pass.h"
  96 #include "langhooks.h"
  97
  98 static struct datadep_stats
  99 {
 100   int num_dependence_tests;
 101   int num_dependence_dependent;
 102   int num_dependence_independent;
 103   int num_dependence_undetermined;
 104
 105   int num_subscript_tests;
 106   int num_subscript_undetermined;
 107   int num_same_subscript_function;
 108
 109   int num_ziv;
 110   int num_ziv_independent;
 111   int num_ziv_dependent;
 112   int num_ziv_unimplemented;
 113
 114   int num_siv;
 115   int num_siv_independent;
 116   int num_siv_dependent;
 117   int num_siv_unimplemented;
 118
 119   int num_miv;
 120   int num_miv_independent;
 121   int num_miv_dependent;
 122   int num_miv_unimplemented;
 123 } dependence_stats;
 124
 125 static bool subscript_dependence_tester_1 (struct data_dependence_relation *,
 126                                            struct data_reference *,
 127                                            struct data_reference *);
 128 /* Returns true iff A divides B.  */
 129
 130 static inline bool
 131 tree_fold_divides_p (tree a, tree b)
 132 {
 133   gcc_assert (TREE_CODE (a) == INTEGER_CST);
 134   gcc_assert (TREE_CODE (b) == INTEGER_CST);
 135   return integer_zerop (int_const_binop (TRUNC_MOD_EXPR, b, a, 0));
 136 }
 137
 138 /* Returns true iff A divides B.  */
 139
 140 static inline bool
 141 int_divides_p (int a, int b)
 142 {
 143   return ((b % a) == 0);
 144 }
 145
 146 \f
 147
 148 /* Dump into FILE all the data references from DATAREFS.  */
 149
 150 void
 151 dump_data_references (FILE *file, VEC (data_reference_p, heap) *datarefs)
 152 {
 153   unsigned int i;
 154   struct data_reference *dr;
 155
 156   for (i = 0; VEC_iterate (data_reference_p, datarefs, i, dr); i++)
 157     dump_data_reference (file, dr);
 158 }
 159
 160 /* Dump into FILE all the dependence relations from DDRS.  */
 161
 162 void
 163 dump_data_dependence_relations (FILE *file,
 164                                 VEC (ddr_p, heap) *ddrs)
 165 {
 166   unsigned int i;
 167   struct data_dependence_relation *ddr;
 168
 169   for (i = 0; VEC_iterate (ddr_p, ddrs, i, ddr); i++)
 170     dump_data_dependence_relation (file, ddr);
 171 }
 172
 173 /* Dump function for a DATA_REFERENCE structure.  */
 174
 175 void
 176 dump_data_reference (FILE *outf,
 177                      struct data_reference *dr)
 178 {
 179   unsigned int i;
 180
 181   fprintf (outf, "(Data Ref: \n  stmt: ");
 182   print_generic_stmt (outf, DR_STMT (dr), 0);
 183   fprintf (outf, "  ref: ");
 184   print_generic_stmt (outf, DR_REF (dr), 0);
 185   fprintf (outf, "  base_object: ");
 186   print_generic_stmt (outf, DR_BASE_OBJECT (dr), 0);
 187
 188   for (i = 0; i < DR_NUM_DIMENSIONS (dr); i++)
 189     {
 190       fprintf (outf, "  Access function %d: ", i);
 191       print_generic_stmt (outf, DR_ACCESS_FN (dr, i), 0);
 192     }
 193   fprintf (outf, ")\n");
 194 }
 195
 196 /* Dumps the affine function described by FN to the file OUTF.  */
 197
 198 static void
 199 dump_affine_function (FILE *outf, affine_fn fn)
 200 {
 201   unsigned i;
 202   tree coef;
 203
 204   print_generic_expr (outf, VEC_index (tree, fn, 0), TDF_SLIM);
 205   for (i = 1; VEC_iterate (tree, fn, i, coef); i++)
 206     {
 207       fprintf (outf, " + ");
 208       print_generic_expr (outf, coef, TDF_SLIM);
 209       fprintf (outf, " * x_%u", i);
 210     }
 211 }
 212
 213 /* Dumps the conflict function CF to the file OUTF.  */
 214
 215 static void
 216 dump_conflict_function (FILE *outf, conflict_function *cf)
 217 {
 218   unsigned i;
 219
 220   if (cf->n == NO_DEPENDENCE)
 221     fprintf (outf, "no dependence\n");
 222   else if (cf->n == NOT_KNOWN)
 223     fprintf (outf, "not known\n");
 224   else
 225     {
 226       for (i = 0; i < cf->n; i++)
 227         {
 228           fprintf (outf, "[");
 229           dump_affine_function (outf, cf->fns[i]);
 230           fprintf (outf, "]\n");
 231         }
 232     }
 233 }
 234
 235 /* Dump function for a SUBSCRIPT structure.  */
 236
 237 void
 238 dump_subscript (FILE *outf, struct subscript *subscript)
 239 {
 240   conflict_function *cf = SUB_CONFLICTS_IN_A (subscript);
 241
 242   fprintf (outf, "\n (subscript \n");
 243   fprintf (outf, "  iterations_that_access_an_element_twice_in_A: ");
 244   dump_conflict_function (outf, cf);
 245   if (CF_NONTRIVIAL_P (cf))
 246     {
 247       tree last_iteration = SUB_LAST_CONFLICT (subscript);
 248       fprintf (outf, "  last_conflict: ");
 249       print_generic_stmt (outf, last_iteration, 0);
 250     }
 251
 252   cf = SUB_CONFLICTS_IN_B (subscript);
 253   fprintf (outf, "  iterations_that_access_an_element_twice_in_B: ");
 254   dump_conflict_function (outf, cf);
 255   if (CF_NONTRIVIAL_P (cf))
 256     {
 257       tree last_iteration = SUB_LAST_CONFLICT (subscript);
 258       fprintf (outf, "  last_conflict: ");
 259       print_generic_stmt (outf, last_iteration, 0);
 260     }
 261
 262   fprintf (outf, "  (Subscript distance: ");
 263   print_generic_stmt (outf, SUB_DISTANCE (subscript), 0);
 264   fprintf (outf, "  )\n");
 265   fprintf (outf, " )\n");
 266 }
 267
 268 /* Print the classic direction vector DIRV to OUTF.  */
 269
 270 void
 271 print_direction_vector (FILE *outf,
 272                         lambda_vector dirv,
 273                         int length)
 274 {
 275   int eq;
 276
 277   for (eq = 0; eq < length; eq++)
 278     {
 279       enum data_dependence_direction dir = dirv[eq];
 280
 281       switch (dir)
 282         {
 283         case dir_positive:
 284           fprintf (outf, "    +");
 285           break;
 286         case dir_negative:
 287           fprintf (outf, "    -");
 288           break;
 289         case dir_equal:
 290           fprintf (outf, "    =");
 291           break;
 292         case dir_positive_or_equal:
 293           fprintf (outf, "   +=");
 294           break;
 295         case dir_positive_or_negative:
 296           fprintf (outf, "   +-");
 297           break;
 298         case dir_negative_or_equal:
 299           fprintf (outf, "   -=");
 300           break;
 301         case dir_star:
 302           fprintf (outf, "    *");
 303           break;
 304         default:
 305           fprintf (outf, "indep");
 306           break;
 307         }
 308     }
 309   fprintf (outf, "\n");
 310 }
 311
 312 /* Print a vector of direction vectors.  */
 313
 314 void
 315 print_dir_vectors (FILE *outf, VEC (lambda_vector, heap) *dir_vects,
 316                    int length)
 317 {
 318   unsigned j;
 319   lambda_vector v;
 320
 321   for (j = 0; VEC_iterate (lambda_vector, dir_vects, j, v); j++)
 322     print_direction_vector (outf, v, length);
 323 }
 324
 325 /* Print a vector of distance vectors.  */
 326
 327 void
 328 print_dist_vectors  (FILE *outf, VEC (lambda_vector, heap) *dist_vects,
 329                      int length)
 330 {
 331   unsigned j;
 332   lambda_vector v;
 333
 334   for (j = 0; VEC_iterate (lambda_vector, dist_vects, j, v); j++)
 335     print_lambda_vector (outf, v, length);
 336 }
 337
 338 /* Debug version.  */
 339
 340 void
 341 debug_data_dependence_relation (struct data_dependence_relation *ddr)
 342 {
 343   dump_data_dependence_relation (stderr, ddr);
 344 }
 345
 346 /* Dump function for a DATA_DEPENDENCE_RELATION structure.  */
 347
 348 void
 349 dump_data_dependence_relation (FILE *outf,
 350                                struct data_dependence_relation *ddr)
 351 {
 352   struct data_reference *dra, *drb;
 353
 354   dra = DDR_A (ddr);
 355   drb = DDR_B (ddr);
 356   fprintf (outf, "(Data Dep: \n");
 357   if (DDR_ARE_DEPENDENT (ddr) == chrec_dont_know)
 358     fprintf (outf, "    (don't know)\n");
 359
 360   else if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
 361     fprintf (outf, "    (no dependence)\n");
 362
 363   else if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
 364     {
 365       unsigned int i;
 366       struct loop *loopi;
 367
 368       for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
 369         {
 370           fprintf (outf, "  access_fn_A: ");
 371           print_generic_stmt (outf, DR_ACCESS_FN (dra, i), 0);
 372           fprintf (outf, "  access_fn_B: ");
 373           print_generic_stmt (outf, DR_ACCESS_FN (drb, i), 0);
 374           dump_subscript (outf, DDR_SUBSCRIPT (ddr, i));
 375         }
 376
 377       fprintf (outf, "  inner loop index: %d\n", DDR_INNER_LOOP (ddr));
 378       fprintf (outf, "  loop nest: (");
 379       for (i = 0; VEC_iterate (loop_p, DDR_LOOP_NEST (ddr), i, loopi); i++)
 380         fprintf (outf, "%d ", loopi->num);
 381       fprintf (outf, ")\n");
 382
 383       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
 384         {
 385           fprintf (outf, "  distance_vector: ");
 386           print_lambda_vector (outf, DDR_DIST_VECT (ddr, i),
 387                                DDR_NB_LOOPS (ddr));
 388         }
 389
 390       for (i = 0; i < DDR_NUM_DIR_VECTS (ddr); i++)
 391         {
 392           fprintf (outf, "  direction_vector: ");
 393           print_direction_vector (outf, DDR_DIR_VECT (ddr, i),
 394                                   DDR_NB_LOOPS (ddr));
 395         }
 396     }
 397
 398   fprintf (outf, ")\n");
 399 }
 400
 401 /* Dump function for a DATA_DEPENDENCE_DIRECTION structure.  */
 402
 403 void
 404 dump_data_dependence_direction (FILE *file,
 405                                 enum data_dependence_direction dir)
 406 {
 407   switch (dir)
 408     {
 409     case dir_positive:
 410       fprintf (file, "+");
 411       break;
 412
 413     case dir_negative:
 414       fprintf (file, "-");
 415       break;
 416
 417     case dir_equal:
 418       fprintf (file, "=");
 419       break;
 420
 421     case dir_positive_or_negative:
 422       fprintf (file, "+-");
 423       break;
 424
 425     case dir_positive_or_equal:
 426       fprintf (file, "+=");
 427       break;
 428
 429     case dir_negative_or_equal:
 430       fprintf (file, "-=");
 431       break;
 432
 433     case dir_star:
 434       fprintf (file, "*");
 435       break;
 436
 437     default:
 438       break;
 439     }
 440 }
 441
 442 /* Dumps the distance and direction vectors in FILE.  DDRS contains
 443    the dependence relations, and VECT_SIZE is the size of the
 444    dependence vectors, or in other words the number of loops in the
 445    considered nest.  */
 446
 447 void
 448 dump_dist_dir_vectors (FILE *file, VEC (ddr_p, heap) *ddrs)
 449 {
 450   unsigned int i, j;
 451   struct data_dependence_relation *ddr;
 452   lambda_vector v;
 453
 454   for (i = 0; VEC_iterate (ddr_p, ddrs, i, ddr); i++)
 455     if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE && DDR_AFFINE_P (ddr))
 456       {
 457         for (j = 0; VEC_iterate (lambda_vector, DDR_DIST_VECTS (ddr), j, v); j++)
 458           {
 459             fprintf (file, "DISTANCE_V (");
 460             print_lambda_vector (file, v, DDR_NB_LOOPS (ddr));
 461             fprintf (file, ")\n");
 462           }
 463
 464         for (j = 0; VEC_iterate (lambda_vector, DDR_DIR_VECTS (ddr), j, v); j++)
 465           {
 466             fprintf (file, "DIRECTION_V (");
 467             print_direction_vector (file, v, DDR_NB_LOOPS (ddr));
 468             fprintf (file, ")\n");
 469           }
 470       }
 471
 472   fprintf (file, "\n\n");
 473 }
 474
 475 /* Dumps the data dependence relations DDRS in FILE.  */
 476
 477 void
 478 dump_ddrs (FILE *file, VEC (ddr_p, heap) *ddrs)
 479 {
 480   unsigned int i;
 481   struct data_dependence_relation *ddr;
 482
 483   for (i = 0; VEC_iterate (ddr_p, ddrs, i, ddr); i++)
 484     dump_data_dependence_relation (file, ddr);
 485
 486   fprintf (file, "\n\n");
 487 }
 488
 489 /* Expresses EXP as VAR + OFF, where off is a constant.  The type of OFF
 490    will be ssizetype.  */
 491
 492 static void
 493 split_constant_offset (tree exp, tree *var, tree *off)
 494 {
 495   tree type = TREE_TYPE (exp), otype;
 496   tree var0, var1;
 497   tree off0, off1;
 498   enum tree_code code;
 499
 500   *var = exp;
 501   STRIP_NOPS (exp);
 502   otype = TREE_TYPE (exp);
 503   code = TREE_CODE (exp);
 504
 505   switch (code)
 506     {
 507     case INTEGER_CST:
 508       *var = build_int_cst (type, 0);
 509       *off = fold_convert (ssizetype, exp);
 510       return;
 511
 512     case POINTER_PLUS_EXPR:
 513       code = PLUS_EXPR;
 514       /* FALLTHROUGH */
 515     case PLUS_EXPR:
 516     case MINUS_EXPR:
 517       split_constant_offset (TREE_OPERAND (exp, 0), &var0, &off0);
 518       split_constant_offset (TREE_OPERAND (exp, 1), &var1, &off1);
 519       *var = fold_convert (type, fold_build2 (TREE_CODE (exp), otype,
 520                                               var0, var1));
 521       *off = size_binop (code, off0, off1);
 522       return;
 523
 524     case MULT_EXPR:
 525       off1 = TREE_OPERAND (exp, 1);
 526       if (TREE_CODE (off1) != INTEGER_CST)
 527         break;
 528
 529       split_constant_offset (TREE_OPERAND (exp, 0), &var0, &off0);
 530       *var = fold_convert (type, fold_build2 (MULT_EXPR, otype,
 531                                               var0, off1));
 532       *off = size_binop (MULT_EXPR, off0, fold_convert (ssizetype, off1));
 533       return;
 534
 535     case ADDR_EXPR:
 536       {
 537         tree op, base, poffset;
 538         HOST_WIDE_INT pbitsize, pbitpos;
 539         enum machine_mode pmode;
 540         int punsignedp, pvolatilep;
 541
 542         op = TREE_OPERAND (exp, 0);
 543         if (!handled_component_p (op))
 544           break;
 545
 546         base = get_inner_reference (op, &pbitsize, &pbitpos, &poffset,
 547                                     &pmode, &punsignedp, &pvolatilep, false);
 548
 549         if (pbitpos % BITS_PER_UNIT != 0)
 550           break;
 551         base = build_fold_addr_expr (base);
 552         off0 = ssize_int (pbitpos / BITS_PER_UNIT);
 553
 554         if (poffset)
 555           {
 556             split_constant_offset (poffset, &poffset, &off1);
 557             off0 = size_binop (PLUS_EXPR, off0, off1);
 558             base = fold_build2 (PLUS_EXPR, TREE_TYPE (base),
 559                                 base,
 560                                 fold_convert (TREE_TYPE (base), poffset));
 561           }
 562
 563         *var = fold_convert (type, base);
 564         *off = off0;
 565         return;
 566       }
 567
 568     default:
 569       break;
 570     }
 571
 572   *off = ssize_int (0);
 573 }
 574
 575 /* Returns the address ADDR of an object in a canonical shape (without nop
 576    casts, and with type of pointer to the object).  */
 577
 578 static tree
 579 canonicalize_base_object_address (tree addr)
 580 {
 581   tree orig = addr;
 582
 583   STRIP_NOPS (addr);
 584
 585   /* The base address may be obtained by casting from integer, in that case
 586      keep the cast.  */
 587   if (!POINTER_TYPE_P (TREE_TYPE (addr)))
 588     return orig;
 589
 590   if (TREE_CODE (addr) != ADDR_EXPR)
 591     return addr;
 592
 593   return build_fold_addr_expr (TREE_OPERAND (addr, 0));
 594 }
 595
 596 /* Analyzes the behavior of the memory reference DR in the innermost loop that
 597    contains it.  */
 598
 599 void
 600 dr_analyze_innermost (struct data_reference *dr)
 601 {
 602   tree stmt = DR_STMT (dr);
 603   struct loop *loop = loop_containing_stmt (stmt);
 604   tree ref = DR_REF (dr);
 605   HOST_WIDE_INT pbitsize, pbitpos;
 606   tree base, poffset;
 607   enum machine_mode pmode;
 608   int punsignedp, pvolatilep;
 609   affine_iv base_iv, offset_iv;
 610   tree init, dinit, step;
 611
 612   if (dump_file && (dump_flags & TDF_DETAILS))
 613     fprintf (dump_file, "analyze_innermost: ");
 614
 615   base = get_inner_reference (ref, &pbitsize, &pbitpos, &poffset,
 616                               &pmode, &punsignedp, &pvolatilep, false);
 617   gcc_assert (base != NULL_TREE);
 618
 619   if (pbitpos % BITS_PER_UNIT != 0)
 620     {
 621       if (dump_file && (dump_flags & TDF_DETAILS))
 622         fprintf (dump_file, "failed: bit offset alignment.\n");
 623       return;
 624     }
 625
 626   base = build_fold_addr_expr (base);
 627   if (!simple_iv (loop, stmt, base, &base_iv, false))
 628     {
 629       if (dump_file && (dump_flags & TDF_DETAILS))
 630         fprintf (dump_file, "failed: evolution of base is not affine.\n");
 631       return;
 632     }
 633   if (!poffset)
 634     {
 635       offset_iv.base = ssize_int (0);
 636       offset_iv.step = ssize_int (0);
 637     }
 638   else if (!simple_iv (loop, stmt, poffset, &offset_iv, false))
 639     {
 640       if (dump_file && (dump_flags & TDF_DETAILS))
 641         fprintf (dump_file, "failed: evolution of offset is not affine.\n");
 642       return;
 643     }
 644
 645   init = ssize_int (pbitpos / BITS_PER_UNIT);
 646   split_constant_offset (base_iv.base, &base_iv.base, &dinit);
 647   init =  size_binop (PLUS_EXPR, init, dinit);
 648   split_constant_offset (offset_iv.base, &offset_iv.base, &dinit);
 649   init =  size_binop (PLUS_EXPR, init, dinit);
 650
 651   step = size_binop (PLUS_EXPR,
 652                      fold_convert (ssizetype, base_iv.step),
 653                      fold_convert (ssizetype, offset_iv.step));
 654
 655   DR_BASE_ADDRESS (dr) = canonicalize_base_object_address (base_iv.base);
 656
 657   DR_OFFSET (dr) = fold_convert (ssizetype, offset_iv.base);
 658   DR_INIT (dr) = init;
 659   DR_STEP (dr) = step;
 660
 661   DR_ALIGNED_TO (dr) = size_int (highest_pow2_factor (offset_iv.base));
 662
 663   if (dump_file && (dump_flags & TDF_DETAILS))
 664     fprintf (dump_file, "success.\n");
 665 }
 666
 667 /* Determines the base object and the list of indices of memory reference
 668    DR, analyzed in loop nest NEST.  */
 669
 670 static void
 671 dr_analyze_indices (struct data_reference *dr, struct loop *nest)
 672 {
 673   tree stmt = DR_STMT (dr);
 674   struct loop *loop = loop_containing_stmt (stmt);
 675   VEC (tree, heap) *access_fns = NULL;
 676   tree ref = unshare_expr (DR_REF (dr)), aref = ref, op;
 677   tree base, off, access_fn;
 678
 679   while (handled_component_p (aref))
 680     {
 681       if (TREE_CODE (aref) == ARRAY_REF)
 682         {
 683           op = TREE_OPERAND (aref, 1);
 684           access_fn = analyze_scalar_evolution (loop, op);
 685           access_fn = resolve_mixers (nest, access_fn);
 686           VEC_safe_push (tree, heap, access_fns, access_fn);
 687
 688           TREE_OPERAND (aref, 1) = build_int_cst (TREE_TYPE (op), 0);
 689         }
 690
 691       aref = TREE_OPERAND (aref, 0);
 692     }
 693
 694   if (INDIRECT_REF_P (aref))
 695     {
 696       op = TREE_OPERAND (aref, 0);
 697       access_fn = analyze_scalar_evolution (loop, op);
 698       access_fn = resolve_mixers (nest, access_fn);
 699       base = initial_condition (access_fn);
 700       split_constant_offset (base, &base, &off);
 701       access_fn = chrec_replace_initial_condition (access_fn,
 702                         fold_convert (TREE_TYPE (base), off));
 703
 704       TREE_OPERAND (aref, 0) = base;
 705       VEC_safe_push (tree, heap, access_fns, access_fn);
 706     }
 707
 708   DR_BASE_OBJECT (dr) = ref;
 709   DR_ACCESS_FNS (dr) = access_fns;
 710 }
 711
 712 /* Extracts the alias analysis information from the memory reference DR.  */
 713
 714 static void
 715 dr_analyze_alias (struct data_reference *dr)
 716 {
 717   tree stmt = DR_STMT (dr);
 718   tree ref = DR_REF (dr);
 719   tree base = get_base_address (ref), addr, smt = NULL_TREE;
 720   ssa_op_iter it;
 721   tree op;
 722   bitmap vops;
 723
 724   if (DECL_P (base))
 725     smt = base;
 726   else if (INDIRECT_REF_P (base))
 727     {
 728       addr = TREE_OPERAND (base, 0);
 729       if (TREE_CODE (addr) == SSA_NAME)
 730         {
 731           smt = symbol_mem_tag (SSA_NAME_VAR (addr));
 732           DR_PTR_INFO (dr) = SSA_NAME_PTR_INFO (addr);
 733         }
 734     }
 735
 736   DR_SYMBOL_TAG (dr) = smt;
 737   if (smt && var_can_have_subvars (smt))
 738     DR_SUBVARS (dr) = get_subvars_for_var (smt);
 739
 740   vops = BITMAP_ALLOC (NULL);
 741   FOR_EACH_SSA_TREE_OPERAND (op, stmt, it, SSA_OP_VIRTUAL_USES)
 742     {
 743       bitmap_set_bit (vops, DECL_UID (SSA_NAME_VAR (op)));
 744     }
 745
 746   DR_VOPS (dr) = vops;
 747 }
 748
 749 /* Returns true if the address of DR is invariant.  */
 750
 751 static bool
 752 dr_address_invariant_p (struct data_reference *dr)
 753 {
 754   unsigned i;
 755   tree idx;
 756
 757   for (i = 0; VEC_iterate (tree, DR_ACCESS_FNS (dr), i, idx); i++)
 758     if (tree_contains_chrecs (idx, NULL))
 759       return false;
 760
 761   return true;
 762 }
 763
 764 /* Frees data reference DR.  */
 765
 766 static void
 767 free_data_ref (data_reference_p dr)
 768 {
 769   BITMAP_FREE (DR_VOPS (dr));
 770   VEC_free (tree, heap, DR_ACCESS_FNS (dr));
 771   free (dr);
 772 }
 773
 774 /* Analyzes memory reference MEMREF accessed in STMT.  The reference
 775    is read if IS_READ is true, write otherwise.  Returns the
 776    data_reference description of MEMREF.  NEST is the outermost loop of the
 777    loop nest in that the reference should be analyzed.  */
 778
 779 struct data_reference *
 780 create_data_ref (struct loop *nest, tree memref, tree stmt, bool is_read)
 781 {
 782   struct data_reference *dr;
 783
 784   if (dump_file && (dump_flags & TDF_DETAILS))
 785     {
 786       fprintf (dump_file, "Creating dr for ");
 787       print_generic_expr (dump_file, memref, TDF_SLIM);
 788       fprintf (dump_file, "\n");
 789     }
 790
 791   dr = XCNEW (struct data_reference);
 792   DR_STMT (dr) = stmt;
 793   DR_REF (dr) = memref;
 794   DR_IS_READ (dr) = is_read;
 795
 796   dr_analyze_innermost (dr);
 797   dr_analyze_indices (dr, nest);
 798   dr_analyze_alias (dr);
 799
 800   if (dump_file && (dump_flags & TDF_DETAILS))
 801     {
 802       fprintf (dump_file, "\tbase_address: ");
 803       print_generic_expr (dump_file, DR_BASE_ADDRESS (dr), TDF_SLIM);
 804       fprintf (dump_file, "\n\toffset from base address: ");
 805       print_generic_expr (dump_file, DR_OFFSET (dr), TDF_SLIM);
 806       fprintf (dump_file, "\n\tconstant offset from base address: ");
 807       print_generic_expr (dump_file, DR_INIT (dr), TDF_SLIM);
 808       fprintf (dump_file, "\n\tstep: ");
 809       print_generic_expr (dump_file, DR_STEP (dr), TDF_SLIM);
 810       fprintf (dump_file, "\n\taligned to: ");
 811       print_generic_expr (dump_file, DR_ALIGNED_TO (dr), TDF_SLIM);
 812       fprintf (dump_file, "\n\tbase_object: ");
 813       print_generic_expr (dump_file, DR_BASE_OBJECT (dr), TDF_SLIM);
 814       fprintf (dump_file, "\n\tsymbol tag: ");
 815       print_generic_expr (dump_file, DR_SYMBOL_TAG (dr), TDF_SLIM);
 816       fprintf (dump_file, "\n");
 817     }
 818
 819   return dr;
 820 }
 821
 822 /* Returns true if FNA == FNB.  */
 823
 824 static bool
 825 affine_function_equal_p (affine_fn fna, affine_fn fnb)
 826 {
 827   unsigned i, n = VEC_length (tree, fna);
 828
 829   if (n != VEC_length (tree, fnb))
 830     return false;
 831
 832   for (i = 0; i < n; i++)
 833     if (!operand_equal_p (VEC_index (tree, fna, i),
 834                           VEC_index (tree, fnb, i), 0))
 835       return false;
 836
 837   return true;
 838 }
 839
 840 /* If all the functions in CF are the same, returns one of them,
 841    otherwise returns NULL.  */
 842
 843 static affine_fn
 844 common_affine_function (conflict_function *cf)
 845 {
 846   unsigned i;
 847   affine_fn comm;
 848
 849   if (!CF_NONTRIVIAL_P (cf))
 850     return NULL;
 851
 852   comm = cf->fns[0];
 853
 854   for (i = 1; i < cf->n; i++)
 855     if (!affine_function_equal_p (comm, cf->fns[i]))
 856       return NULL;
 857
 858   return comm;
 859 }
 860
 861 /* Returns the base of the affine function FN.  */
 862
 863 static tree
 864 affine_function_base (affine_fn fn)
 865 {
 866   return VEC_index (tree, fn, 0);
 867 }
 868
 869 /* Returns true if FN is a constant.  */
 870
 871 static bool
 872 affine_function_constant_p (affine_fn fn)
 873 {
 874   unsigned i;
 875   tree coef;
 876
 877   for (i = 1; VEC_iterate (tree, fn, i, coef); i++)
 878     if (!integer_zerop (coef))
 879       return false;
 880
 881   return true;
 882 }
 883
 884 /* Returns true if FN is the zero constant function.  */
 885
 886 static bool
 887 affine_function_zero_p (affine_fn fn)
 888 {
 889   return (integer_zerop (affine_function_base (fn))
 890           && affine_function_constant_p (fn));
 891 }
 892
 893 /* Applies operation OP on affine functions FNA and FNB, and returns the
 894    result.  */
 895
 896 static affine_fn
 897 affine_fn_op (enum tree_code op, affine_fn fna, affine_fn fnb)
 898 {
 899   unsigned i, n, m;
 900   affine_fn ret;
 901   tree coef;
 902
 903   if (VEC_length (tree, fnb) > VEC_length (tree, fna))
 904     {
 905       n = VEC_length (tree, fna);
 906       m = VEC_length (tree, fnb);
 907     }
 908   else
 909     {
 910       n = VEC_length (tree, fnb);
 911       m = VEC_length (tree, fna);
 912     }
 913
 914   ret = VEC_alloc (tree, heap, m);
 915   for (i = 0; i < n; i++)
 916     VEC_quick_push (tree, ret,
 917                     fold_build2 (op, integer_type_node,
 918                                  VEC_index (tree, fna, i),
 919                                  VEC_index (tree, fnb, i)));
 920
 921   for (; VEC_iterate (tree, fna, i, coef); i++)
 922     VEC_quick_push (tree, ret,
 923                     fold_build2 (op, integer_type_node,
 924                                  coef, integer_zero_node));
 925   for (; VEC_iterate (tree, fnb, i, coef); i++)
 926     VEC_quick_push (tree, ret,
 927                     fold_build2 (op, integer_type_node,
 928                                  integer_zero_node, coef));
 929
 930   return ret;
 931 }
 932
 933 /* Returns the sum of affine functions FNA and FNB.  */
 934
 935 static affine_fn
 936 affine_fn_plus (affine_fn fna, affine_fn fnb)
 937 {
 938   return affine_fn_op (PLUS_EXPR, fna, fnb);
 939 }
 940
 941 /* Returns the difference of affine functions FNA and FNB.  */
 942
 943 static affine_fn
 944 affine_fn_minus (affine_fn fna, affine_fn fnb)
 945 {
 946   return affine_fn_op (MINUS_EXPR, fna, fnb);
 947 }
 948
 949 /* Frees affine function FN.  */
 950
 951 static void
 952 affine_fn_free (affine_fn fn)
 953 {
 954   VEC_free (tree, heap, fn);
 955 }
 956
 957 /* Determine for each subscript in the data dependence relation DDR
 958    the distance.  */
 959
 960 static void
 961 compute_subscript_distance (struct data_dependence_relation *ddr)
 962 {
 963   conflict_function *cf_a, *cf_b;
 964   affine_fn fn_a, fn_b, diff;
 965
 966   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
 967     {
 968       unsigned int i;
 969
 970       for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
 971         {
 972           struct subscript *subscript;
 973
 974           subscript = DDR_SUBSCRIPT (ddr, i);
 975           cf_a = SUB_CONFLICTS_IN_A (subscript);
 976           cf_b = SUB_CONFLICTS_IN_B (subscript);
 977
 978           fn_a = common_affine_function (cf_a);
 979           fn_b = common_affine_function (cf_b);
 980           if (!fn_a || !fn_b)
 981             {
 982               SUB_DISTANCE (subscript) = chrec_dont_know;
 983               return;
 984             }
 985           diff = affine_fn_minus (fn_a, fn_b);
 986
 987           if (affine_function_constant_p (diff))
 988             SUB_DISTANCE (subscript) = affine_function_base (diff);
 989           else
 990             SUB_DISTANCE (subscript) = chrec_dont_know;
 991
 992           affine_fn_free (diff);
 993         }
 994     }
 995 }
 996
 997 /* Returns the conflict function for "unknown".  */
 998
 999 static conflict_function *
1000 conflict_fn_not_known (void)
1001 {
1002   conflict_function *fn = XCNEW (conflict_function);
1003   fn->n = NOT_KNOWN;
1004
1005   return fn;
1006 }
1007
1008 /* Returns the conflict function for "independent".  */
1009
1010 static conflict_function *
1011 conflict_fn_no_dependence (void)
1012 {
1013   conflict_function *fn = XCNEW (conflict_function);
1014   fn->n = NO_DEPENDENCE;
1015
1016   return fn;
1017 }
1018
1019 /* Returns true if the address of OBJ is invariant in LOOP.  */
1020
1021 static bool
1022 object_address_invariant_in_loop_p (struct loop *loop, tree obj)
1023 {
1024   while (handled_component_p (obj))
1025     {
1026       if (TREE_CODE (obj) == ARRAY_REF)
1027         {
1028           /* Index of the ARRAY_REF was zeroed in analyze_indices, thus we only
1029              need to check the stride and the lower bound of the reference.  */
1030           if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 2),
1031                                                       loop->num)
1032               || chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 3),
1033                                                          loop->num))
1034             return false;
1035         }
1036       else if (TREE_CODE (obj) == COMPONENT_REF)
1037         {
1038           if (chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 2),
1039                                                       loop->num))
1040             return false;
1041         }
1042       obj = TREE_OPERAND (obj, 0);
1043     }
1044
1045   if (!INDIRECT_REF_P (obj))
1046     return true;
1047
1048   return !chrec_contains_symbols_defined_in_loop (TREE_OPERAND (obj, 0),
1049                                                   loop->num);
1050 }
1051
1052 /* Returns true if A and B are accesses to different objects, or to different
1053    fields of the same object.  */
1054
1055 static bool
1056 disjoint_objects_p (tree a, tree b)
1057 {
1058   tree base_a, base_b;
1059   VEC (tree, heap) *comp_a = NULL, *comp_b = NULL;
1060   bool ret;
1061
1062   base_a = get_base_address (a);
1063   base_b = get_base_address (b);
1064
1065   if (DECL_P (base_a)
1066       && DECL_P (base_b)
1067       && base_a != base_b)
1068     return true;
1069
1070   if (!operand_equal_p (base_a, base_b, 0))
1071     return false;
1072
1073   /* Compare the component references of A and B.  We must start from the inner
1074      ones, so record them to the vector first.  */
1075   while (handled_component_p (a))
1076     {
1077       VEC_safe_push (tree, heap, comp_a, a);
1078       a = TREE_OPERAND (a, 0);
1079     }
1080   while (handled_component_p (b))
1081     {
1082       VEC_safe_push (tree, heap, comp_b, b);
1083       b = TREE_OPERAND (b, 0);
1084     }
1085
1086   ret = false;
1087   while (1)
1088     {
1089       if (VEC_length (tree, comp_a) == 0
1090           || VEC_length (tree, comp_b) == 0)
1091         break;
1092
1093       a = VEC_pop (tree, comp_a);
1094       b = VEC_pop (tree, comp_b);
1095
1096       /* Real and imaginary part of a variable do not alias.  */
1097       if ((TREE_CODE (a) == REALPART_EXPR
1098            && TREE_CODE (b) == IMAGPART_EXPR)
1099           || (TREE_CODE (a) == IMAGPART_EXPR
1100               && TREE_CODE (b) == REALPART_EXPR))
1101         {
1102           ret = true;
1103           break;
1104         }
1105
1106       if (TREE_CODE (a) != TREE_CODE (b))
1107         break;
1108
1109       /* Nothing to do for ARRAY_REFs, as the indices of array_refs in
1110          DR_BASE_OBJECT are always zero.  */
1111       if (TREE_CODE (a) == ARRAY_REF)
1112         continue;
1113       else if (TREE_CODE (a) == COMPONENT_REF)
1114         {
1115           if (operand_equal_p (TREE_OPERAND (a, 1), TREE_OPERAND (b, 1), 0))
1116             continue;
1117
1118           /* Different fields of unions may overlap.  */
1119           base_a = TREE_OPERAND (a, 0);
1120           if (TREE_CODE (TREE_TYPE (base_a)) == UNION_TYPE)
1121             break;
1122
1123           /* Different fields of structures cannot.  */
1124           ret = true;
1125           break;
1126         }
1127       else
1128         break;
1129     }
1130
1131   VEC_free (tree, heap, comp_a);
1132   VEC_free (tree, heap, comp_b);
1133
1134   return ret;
1135 }
1136
1137 /* Returns false if we can prove that data references A and B do not alias,
1138    true otherwise.  */
1139
1140 static bool
1141 dr_may_alias_p (struct data_reference *a, struct data_reference *b)
1142 {
1143   tree addr_a = DR_BASE_ADDRESS (a);
1144   tree addr_b = DR_BASE_ADDRESS (b);
1145   tree type_a, type_b;
1146   tree decl_a = NULL_TREE, decl_b = NULL_TREE;
1147
1148   /* If the sets of virtual operands are disjoint, the memory references do not
1149      alias.  */
1150   if (!bitmap_intersect_p (DR_VOPS (a), DR_VOPS (b)))
1151     return false;
1152
1153   /* If the accessed objects are disjoint, the memory references do not
1154      alias.  */
1155   if (disjoint_objects_p (DR_BASE_OBJECT (a), DR_BASE_OBJECT (b)))
1156     return false;
1157
1158   if (!addr_a || !addr_b)
1159     return true;
1160
1161   /* If the references are based on different static objects, they cannot alias
1162      (PTA should be able to disambiguate such accesses, but often it fails to,
1163      since currently we cannot distinguish between pointer and offset in pointer
1164      arithmetics).  */
1165   if (TREE_CODE (addr_a) == ADDR_EXPR
1166       && TREE_CODE (addr_b) == ADDR_EXPR)
1167     return TREE_OPERAND (addr_a, 0) == TREE_OPERAND (addr_b, 0);
1168
1169   /* An instruction writing through a restricted pointer is "independent" of any
1170      instruction reading or writing through a different restricted pointer,
1171      in the same block/scope.  */
1172
1173   type_a = TREE_TYPE (addr_a);
1174   type_b = TREE_TYPE (addr_b);
1175   gcc_assert (POINTER_TYPE_P (type_a) && POINTER_TYPE_P (type_b));
1176
1177   if (TREE_CODE (addr_a) == SSA_NAME)
1178     decl_a = SSA_NAME_VAR (addr_a);
1179   if (TREE_CODE (addr_b) == SSA_NAME)
1180     decl_b = SSA_NAME_VAR (addr_b);
1181
1182   if (TYPE_RESTRICT (type_a) && TYPE_RESTRICT (type_b)
1183       && (!DR_IS_READ (a) || !DR_IS_READ (b))
1184       && decl_a && DECL_P (decl_a)
1185       && decl_b && DECL_P (decl_b)
1186       && decl_a != decl_b
1187       && TREE_CODE (DECL_CONTEXT (decl_a)) == FUNCTION_DECL
1188       && DECL_CONTEXT (decl_a) == DECL_CONTEXT (decl_b))
1189     return false;
1190
1191   return true;
1192 }
1193
1194 /* Initialize a data dependence relation between data accesses A and
1195    B.  NB_LOOPS is the number of loops surrounding the references: the
1196    size of the classic distance/direction vectors.  */
1197
1198 static struct data_dependence_relation *
1199 initialize_data_dependence_relation (struct data_reference *a,
1200                                      struct data_reference *b,
1201                                      VEC (loop_p, heap) *loop_nest)
1202 {
1203   struct data_dependence_relation *res;
1204   unsigned int i;
1205
1206   res = XNEW (struct data_dependence_relation);
1207   DDR_A (res) = a;
1208   DDR_B (res) = b;
1209   DDR_LOOP_NEST (res) = NULL;
1210
1211   if (a == NULL || b == NULL)
1212     {
1213       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1214       return res;
1215     }
1216
1217   /* If the data references do not alias, then they are independent.  */
1218   if (!dr_may_alias_p (a, b))
1219     {
1220       DDR_ARE_DEPENDENT (res) = chrec_known;
1221       return res;
1222     }
1223
1224   /* If the references do not access the same object, we do not know
1225      whether they alias or not.  */
1226   if (!operand_equal_p (DR_BASE_OBJECT (a), DR_BASE_OBJECT (b), 0))
1227     {
1228       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1229       return res;
1230     }
1231
1232   /* If the base of the object is not invariant in the loop nest, we cannot
1233      analyze it.  TODO -- in fact, it would suffice to record that there may
1234      be arbitrary dependences in the loops where the base object varies.  */
1235   if (!object_address_invariant_in_loop_p (VEC_index (loop_p, loop_nest, 0),
1236                                            DR_BASE_OBJECT (a)))
1237     {
1238       DDR_ARE_DEPENDENT (res) = chrec_dont_know;
1239       return res;
1240     }
1241
1242   gcc_assert (DR_NUM_DIMENSIONS (a) == DR_NUM_DIMENSIONS (b));
1243
1244   DDR_AFFINE_P (res) = true;
1245   DDR_ARE_DEPENDENT (res) = NULL_TREE;
1246   DDR_SUBSCRIPTS (res) = VEC_alloc (subscript_p, heap, DR_NUM_DIMENSIONS (a));
1247   DDR_LOOP_NEST (res) = loop_nest;
1248   DDR_INNER_LOOP (res) = 0;
1249   DDR_DIR_VECTS (res) = NULL;
1250   DDR_DIST_VECTS (res) = NULL;
1251
1252   for (i = 0; i < DR_NUM_DIMENSIONS (a); i++)
1253     {
1254       struct subscript *subscript;
1255
1256       subscript = XNEW (struct subscript);
1257       SUB_CONFLICTS_IN_A (subscript) = conflict_fn_not_known ();
1258       SUB_CONFLICTS_IN_B (subscript) = conflict_fn_not_known ();
1259       SUB_LAST_CONFLICT (subscript) = chrec_dont_know;
1260       SUB_DISTANCE (subscript) = chrec_dont_know;
1261       VEC_safe_push (subscript_p, heap, DDR_SUBSCRIPTS (res), subscript);
1262     }
1263
1264   return res;
1265 }
1266
1267 /* Frees memory used by the conflict function F.  */
1268
1269 static void
1270 free_conflict_function (conflict_function *f)
1271 {
1272   unsigned i;
1273
1274   if (CF_NONTRIVIAL_P (f))
1275     {
1276       for (i = 0; i < f->n; i++)
1277         affine_fn_free (f->fns[i]);
1278     }
1279   free (f);
1280 }
1281
1282 /* Frees memory used by SUBSCRIPTS.  */
1283
1284 static void
1285 free_subscripts (VEC (subscript_p, heap) *subscripts)
1286 {
1287   unsigned i;
1288   subscript_p s;
1289
1290   for (i = 0; VEC_iterate (subscript_p, subscripts, i, s); i++)
1291     {
1292       free_conflict_function (s->conflicting_iterations_in_a);
1293       free_conflict_function (s->conflicting_iterations_in_b);
1294     }
1295   VEC_free (subscript_p, heap, subscripts);
1296 }
1297
1298 /* Set DDR_ARE_DEPENDENT to CHREC and finalize the subscript overlap
1299    description.  */
1300
1301 static inline void
1302 finalize_ddr_dependent (struct data_dependence_relation *ddr,
1303                         tree chrec)
1304 {
1305   if (dump_file && (dump_flags & TDF_DETAILS))
1306     {
1307       fprintf (dump_file, "(dependence classified: ");
1308       print_generic_expr (dump_file, chrec, 0);
1309       fprintf (dump_file, ")\n");
1310     }
1311
1312   DDR_ARE_DEPENDENT (ddr) = chrec;
1313   free_subscripts (DDR_SUBSCRIPTS (ddr));
1314 }
1315
1316 /* The dependence relation DDR cannot be represented by a distance
1317    vector.  */
1318
1319 static inline void
1320 non_affine_dependence_relation (struct data_dependence_relation *ddr)
1321 {
1322   if (dump_file && (dump_flags & TDF_DETAILS))
1323     fprintf (dump_file, "(Dependence relation cannot be represented by distance vector.) \n");
1324
1325   DDR_AFFINE_P (ddr) = false;
1326 }
1327
1328 \f
1329
1330 /* This section contains the classic Banerjee tests.  */
1331
1332 /* Returns true iff CHREC_A and CHREC_B are not dependent on any index
1333    variables, i.e., if the ZIV (Zero Index Variable) test is true.  */
1334
1335 static inline bool
1336 ziv_subscript_p (tree chrec_a,
1337                  tree chrec_b)
1338 {
1339   return (evolution_function_is_constant_p (chrec_a)
1340           && evolution_function_is_constant_p (chrec_b));
1341 }
1342
1343 /* Returns true iff CHREC_A and CHREC_B are dependent on an index
1344    variable, i.e., if the SIV (Single Index Variable) test is true.  */
1345
1346 static bool
1347 siv_subscript_p (tree chrec_a,
1348                  tree chrec_b)
1349 {
1350   if ((evolution_function_is_constant_p (chrec_a)
1351        && evolution_function_is_univariate_p (chrec_b))
1352       || (evolution_function_is_constant_p (chrec_b)
1353           && evolution_function_is_univariate_p (chrec_a)))
1354     return true;
1355
1356   if (evolution_function_is_univariate_p (chrec_a)
1357       && evolution_function_is_univariate_p (chrec_b))
1358     {
1359       switch (TREE_CODE (chrec_a))
1360         {
1361         case POLYNOMIAL_CHREC:
1362           switch (TREE_CODE (chrec_b))
1363             {
1364             case POLYNOMIAL_CHREC:
1365               if (CHREC_VARIABLE (chrec_a) != CHREC_VARIABLE (chrec_b))
1366                 return false;
1367
1368             default:
1369               return true;
1370             }
1371
1372         default:
1373           return true;
1374         }
1375     }
1376
1377   return false;
1378 }
1379
1380 /* Creates a conflict function with N dimensions.  The affine functions
1381    in each dimension follow.  */
1382
1383 static conflict_function *
1384 conflict_fn (unsigned n, ...)
1385 {
1386   unsigned i;
1387   conflict_function *ret = XCNEW (conflict_function);
1388   va_list ap;
1389
1390   gcc_assert (0 < n && n <= MAX_DIM);
1391   va_start(ap, n);
1392
1393   ret->n = n;
1394   for (i = 0; i < n; i++)
1395     ret->fns[i] = va_arg (ap, affine_fn);
1396   va_end(ap);
1397
1398   return ret;
1399 }
1400
1401 /* Returns constant affine function with value CST.  */
1402
1403 static affine_fn
1404 affine_fn_cst (tree cst)
1405 {
1406   affine_fn fn = VEC_alloc (tree, heap, 1);
1407   VEC_quick_push (tree, fn, cst);
1408   return fn;
1409 }
1410
1411 /* Returns affine function with single variable, CST + COEF * x_DIM.  */
1412
1413 static affine_fn
1414 affine_fn_univar (tree cst, unsigned dim, tree coef)
1415 {
1416   affine_fn fn = VEC_alloc (tree, heap, dim + 1);
1417   unsigned i;
1418
1419   gcc_assert (dim > 0);
1420   VEC_quick_push (tree, fn, cst);
1421   for (i = 1; i < dim; i++)
1422     VEC_quick_push (tree, fn, integer_zero_node);
1423   VEC_quick_push (tree, fn, coef);
1424   return fn;
1425 }
1426
1427 /* Analyze a ZIV (Zero Index Variable) subscript.  *OVERLAPS_A and
1428    *OVERLAPS_B are initialized to the functions that describe the
1429    relation between the elements accessed twice by CHREC_A and
1430    CHREC_B.  For k >= 0, the following property is verified:
1431
1432    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
1433
1434 static void
1435 analyze_ziv_subscript (tree chrec_a,
1436                        tree chrec_b,
1437                        conflict_function **overlaps_a,
1438                        conflict_function **overlaps_b,
1439                        tree *last_conflicts)
1440 {
1441   tree difference;
1442   dependence_stats.num_ziv++;
1443
1444   if (dump_file && (dump_flags & TDF_DETAILS))
1445     fprintf (dump_file, "(analyze_ziv_subscript \n");
1446
1447   chrec_a = chrec_convert (integer_type_node, chrec_a, NULL_TREE);
1448   chrec_b = chrec_convert (integer_type_node, chrec_b, NULL_TREE);
1449   difference = chrec_fold_minus (integer_type_node, chrec_a, chrec_b);
1450
1451   switch (TREE_CODE (difference))
1452     {
1453     case INTEGER_CST:
1454       if (integer_zerop (difference))
1455         {
1456           /* The difference is equal to zero: the accessed index
1457              overlaps for each iteration in the loop.  */
1458           *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1459           *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1460           *last_conflicts = chrec_dont_know;
1461           dependence_stats.num_ziv_dependent++;
1462         }
1463       else
1464         {
1465           /* The accesses do not overlap.  */
1466           *overlaps_a = conflict_fn_no_dependence ();
1467           *overlaps_b = conflict_fn_no_dependence ();
1468           *last_conflicts = integer_zero_node;
1469           dependence_stats.num_ziv_independent++;
1470         }
1471       break;
1472
1473     default:
1474       /* We're not sure whether the indexes overlap.  For the moment,
1475          conservatively answer "don't know".  */
1476       if (dump_file && (dump_flags & TDF_DETAILS))
1477         fprintf (dump_file, "ziv test failed: difference is non-integer.\n");
1478
1479       *overlaps_a = conflict_fn_not_known ();
1480       *overlaps_b = conflict_fn_not_known ();
1481       *last_conflicts = chrec_dont_know;
1482       dependence_stats.num_ziv_unimplemented++;
1483       break;
1484     }
1485
1486   if (dump_file && (dump_flags & TDF_DETAILS))
1487     fprintf (dump_file, ")\n");
1488 }
1489
1490 /* Sets NIT to the estimated number of executions of the statements in
1491    LOOP.  If CONSERVATIVE is true, we must be sure that NIT is at least as
1492    large as the number of iterations.  If we have no reliable estimate,
1493    the function returns false, otherwise returns true.  */
1494
1495 bool
1496 estimated_loop_iterations (struct loop *loop, bool conservative,
1497                            double_int *nit)
1498 {
1499   estimate_numbers_of_iterations_loop (loop);
1500   if (conservative)
1501     {
1502       if (!loop->any_upper_bound)
1503         return false;
1504
1505       *nit = loop->nb_iterations_upper_bound;
1506     }
1507   else
1508     {
1509       if (!loop->any_estimate)
1510         return false;
1511
1512       *nit = loop->nb_iterations_estimate;
1513     }
1514
1515   return true;
1516 }
1517
1518 /* Similar to estimated_loop_iterations, but returns the estimate only
1519    if it fits to HOST_WIDE_INT.  If this is not the case, or the estimate
1520    on the number of iterations of LOOP could not be derived, returns -1.  */
1521
1522 HOST_WIDE_INT
1523 estimated_loop_iterations_int (struct loop *loop, bool conservative)
1524 {
1525   double_int nit;
1526   HOST_WIDE_INT hwi_nit;
1527
1528   if (!estimated_loop_iterations (loop, conservative, &nit))
1529     return -1;
1530
1531   if (!double_int_fits_in_shwi_p (nit))
1532     return -1;
1533   hwi_nit = double_int_to_shwi (nit);
1534
1535   return hwi_nit < 0 ? -1 : hwi_nit;
1536 }
1537
1538 /* Similar to estimated_loop_iterations, but returns the estimate as a tree,
1539    and only if it fits to the int type.  If this is not the case, or the
1540    estimate on the number of iterations of LOOP could not be derived, returns
1541    chrec_dont_know.  */
1542
1543 static tree
1544 estimated_loop_iterations_tree (struct loop *loop, bool conservative)
1545 {
1546   double_int nit;
1547   tree type;
1548
1549   if (!estimated_loop_iterations (loop, conservative, &nit))
1550     return chrec_dont_know;
1551
1552   type = lang_hooks.types.type_for_size (INT_TYPE_SIZE, true);
1553   if (!double_int_fits_to_tree_p (type, nit))
1554     return chrec_dont_know;
1555
1556   return double_int_to_tree (type, nit);
1557 }
1558
1559 /* Analyze a SIV (Single Index Variable) subscript where CHREC_A is a
1560    constant, and CHREC_B is an affine function.  *OVERLAPS_A and
1561    *OVERLAPS_B are initialized to the functions that describe the
1562    relation between the elements accessed twice by CHREC_A and
1563    CHREC_B.  For k >= 0, the following property is verified:
1564
1565    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
1566
1567 static void
1568 analyze_siv_subscript_cst_affine (tree chrec_a,
1569                                   tree chrec_b,
1570                                   conflict_function **overlaps_a,
1571                                   conflict_function **overlaps_b,
1572                                   tree *last_conflicts)
1573 {
1574   bool value0, value1, value2;
1575   tree difference, tmp;
1576
1577   chrec_a = chrec_convert (integer_type_node, chrec_a, NULL_TREE);
1578   chrec_b = chrec_convert (integer_type_node, chrec_b, NULL_TREE);
1579   difference = chrec_fold_minus
1580     (integer_type_node, initial_condition (chrec_b), chrec_a);
1581
1582   if (!chrec_is_positive (initial_condition (difference), &value0))
1583     {
1584       if (dump_file && (dump_flags & TDF_DETAILS))
1585         fprintf (dump_file, "siv test failed: chrec is not positive.\n");
1586
1587       dependence_stats.num_siv_unimplemented++;
1588       *overlaps_a = conflict_fn_not_known ();
1589       *overlaps_b = conflict_fn_not_known ();
1590       *last_conflicts = chrec_dont_know;
1591       return;
1592     }
1593   else
1594     {
1595       if (value0 == false)
1596         {
1597           if (!chrec_is_positive (CHREC_RIGHT (chrec_b), &value1))
1598             {
1599               if (dump_file && (dump_flags & TDF_DETAILS))
1600                 fprintf (dump_file, "siv test failed: chrec not positive.\n");
1601
1602               *overlaps_a = conflict_fn_not_known ();
1603               *overlaps_b = conflict_fn_not_known ();
1604               *last_conflicts = chrec_dont_know;
1605               dependence_stats.num_siv_unimplemented++;
1606               return;
1607             }
1608           else
1609             {
1610               if (value1 == true)
1611                 {
1612                   /* Example:
1613                      chrec_a = 12
1614                      chrec_b = {10, +, 1}
1615                   */
1616
1617                   if (tree_fold_divides_p (CHREC_RIGHT (chrec_b), difference))
1618                     {
1619                       HOST_WIDE_INT numiter;
1620                       struct loop *loop = get_chrec_loop (chrec_b);
1621
1622                       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1623                       tmp = fold_build2 (EXACT_DIV_EXPR, integer_type_node,
1624                                          fold_build1 (ABS_EXPR,
1625                                                       integer_type_node,
1626                                                       difference),
1627                                          CHREC_RIGHT (chrec_b));
1628                       *overlaps_b = conflict_fn (1, affine_fn_cst (tmp));
1629                       *last_conflicts = integer_one_node;
1630
1631
1632                       /* Perform weak-zero siv test to see if overlap is
1633                          outside the loop bounds.  */
1634                       numiter = estimated_loop_iterations_int (loop, true);
1635
1636                       if (numiter >= 0
1637                           && compare_tree_int (tmp, numiter) > 0)
1638                         {
1639                           free_conflict_function (*overlaps_a);
1640                           free_conflict_function (*overlaps_b);
1641                           *overlaps_a = conflict_fn_no_dependence ();
1642                           *overlaps_b = conflict_fn_no_dependence ();
1643                           *last_conflicts = integer_zero_node;
1644                           dependence_stats.num_siv_independent++;
1645                           return;
1646                         }
1647                       dependence_stats.num_siv_dependent++;
1648                       return;
1649                     }
1650
1651                   /* When the step does not divide the difference, there are
1652                      no overlaps.  */
1653                   else
1654                     {
1655                       *overlaps_a = conflict_fn_no_dependence ();
1656                       *overlaps_b = conflict_fn_no_dependence ();
1657                       *last_conflicts = integer_zero_node;
1658                       dependence_stats.num_siv_independent++;
1659                       return;
1660                     }
1661                 }
1662
1663               else
1664                 {
1665                   /* Example:
1666                      chrec_a = 12
1667                      chrec_b = {10, +, -1}
1668
1669                      In this case, chrec_a will not overlap with chrec_b.  */
1670                   *overlaps_a = conflict_fn_no_dependence ();
1671                   *overlaps_b = conflict_fn_no_dependence ();
1672                   *last_conflicts = integer_zero_node;
1673                   dependence_stats.num_siv_independent++;
1674                   return;
1675                 }
1676             }
1677         }
1678       else
1679         {
1680           if (!chrec_is_positive (CHREC_RIGHT (chrec_b), &value2))
1681             {
1682               if (dump_file && (dump_flags & TDF_DETAILS))
1683                 fprintf (dump_file, "siv test failed: chrec not positive.\n");
1684
1685               *overlaps_a = conflict_fn_not_known ();
1686               *overlaps_b = conflict_fn_not_known ();
1687               *last_conflicts = chrec_dont_know;
1688               dependence_stats.num_siv_unimplemented++;
1689               return;
1690             }
1691           else
1692             {
1693               if (value2 == false)
1694                 {
1695                   /* Example:
1696                      chrec_a = 3
1697                      chrec_b = {10, +, -1}
1698                   */
1699                   if (tree_fold_divides_p (CHREC_RIGHT (chrec_b), difference))
1700                     {
1701                       HOST_WIDE_INT numiter;
1702                       struct loop *loop = get_chrec_loop (chrec_b);
1703
1704                       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1705                       tmp = fold_build2 (EXACT_DIV_EXPR,
1706                                          integer_type_node, difference,
1707                                          CHREC_RIGHT (chrec_b));
1708                       *overlaps_b = conflict_fn (1, affine_fn_cst (tmp));
1709                       *last_conflicts = integer_one_node;
1710
1711                       /* Perform weak-zero siv test to see if overlap is
1712                          outside the loop bounds.  */
1713                       numiter = estimated_loop_iterations_int (loop, true);
1714
1715                       if (numiter >= 0
1716                           && compare_tree_int (tmp, numiter) > 0)
1717                         {
1718                           free_conflict_function (*overlaps_a);
1719                           free_conflict_function (*overlaps_b);
1720                           *overlaps_a = conflict_fn_no_dependence ();
1721                           *overlaps_b = conflict_fn_no_dependence ();
1722                           *last_conflicts = integer_zero_node;
1723                           dependence_stats.num_siv_independent++;
1724                           return;
1725                         }
1726                       dependence_stats.num_siv_dependent++;
1727                       return;
1728                     }
1729
1730                   /* When the step does not divide the difference, there
1731                      are no overlaps.  */
1732                   else
1733                     {
1734                       *overlaps_a = conflict_fn_no_dependence ();
1735                       *overlaps_b = conflict_fn_no_dependence ();
1736                       *last_conflicts = integer_zero_node;
1737                       dependence_stats.num_siv_independent++;
1738                       return;
1739                     }
1740                 }
1741               else
1742                 {
1743                   /* Example:
1744                      chrec_a = 3
1745                      chrec_b = {4, +, 1}
1746
1747                      In this case, chrec_a will not overlap with chrec_b.  */
1748                   *overlaps_a = conflict_fn_no_dependence ();
1749                   *overlaps_b = conflict_fn_no_dependence ();
1750                   *last_conflicts = integer_zero_node;
1751                   dependence_stats.num_siv_independent++;
1752                   return;
1753                 }
1754             }
1755         }
1756     }
1757 }
1758
1759 /* Helper recursive function for initializing the matrix A.  Returns
1760    the initial value of CHREC.  */
1761
1762 static int
1763 initialize_matrix_A (lambda_matrix A, tree chrec, unsigned index, int mult)
1764 {
1765   gcc_assert (chrec);
1766
1767   if (TREE_CODE (chrec) != POLYNOMIAL_CHREC)
1768     return int_cst_value (chrec);
1769
1770   A[index][0] = mult * int_cst_value (CHREC_RIGHT (chrec));
1771   return initialize_matrix_A (A, CHREC_LEFT (chrec), index + 1, mult);
1772 }
1773
1774 #define FLOOR_DIV(x,y) ((x) / (y))
1775
1776 /* Solves the special case of the Diophantine equation:
1777    | {0, +, STEP_A}_x (OVERLAPS_A) = {0, +, STEP_B}_y (OVERLAPS_B)
1778
1779    Computes the descriptions OVERLAPS_A and OVERLAPS_B.  NITER is the
1780    number of iterations that loops X and Y run.  The overlaps will be
1781    constructed as evolutions in dimension DIM.  */
1782
1783 static void
1784 compute_overlap_steps_for_affine_univar (int niter, int step_a, int step_b,
1785                                          affine_fn *overlaps_a,
1786                                          affine_fn *overlaps_b,
1787                                          tree *last_conflicts, int dim)
1788 {
1789   if (((step_a > 0 && step_b > 0)
1790        || (step_a < 0 && step_b < 0)))
1791     {
1792       int step_overlaps_a, step_overlaps_b;
1793       int gcd_steps_a_b, last_conflict, tau2;
1794
1795       gcd_steps_a_b = gcd (step_a, step_b);
1796       step_overlaps_a = step_b / gcd_steps_a_b;
1797       step_overlaps_b = step_a / gcd_steps_a_b;
1798
1799       tau2 = FLOOR_DIV (niter, step_overlaps_a);
1800       tau2 = MIN (tau2, FLOOR_DIV (niter, step_overlaps_b));
1801       last_conflict = tau2;
1802
1803       *overlaps_a = affine_fn_univar (integer_zero_node, dim,
1804                                       build_int_cst (NULL_TREE,
1805                                                      step_overlaps_a));
1806       *overlaps_b = affine_fn_univar (integer_zero_node, dim,
1807                                       build_int_cst (NULL_TREE,
1808                                                      step_overlaps_b));
1809       *last_conflicts = build_int_cst (NULL_TREE, last_conflict);
1810     }
1811
1812   else
1813     {
1814       *overlaps_a = affine_fn_cst (integer_zero_node);
1815       *overlaps_b = affine_fn_cst (integer_zero_node);
1816       *last_conflicts = integer_zero_node;
1817     }
1818 }
1819
1820 /* Solves the special case of a Diophantine equation where CHREC_A is
1821    an affine bivariate function, and CHREC_B is an affine univariate
1822    function.  For example,
1823
1824    | {{0, +, 1}_x, +, 1335}_y = {0, +, 1336}_z
1825
1826    has the following overlapping functions:
1827
1828    | x (t, u, v) = {{0, +, 1336}_t, +, 1}_v
1829    | y (t, u, v) = {{0, +, 1336}_u, +, 1}_v
1830    | z (t, u, v) = {{{0, +, 1}_t, +, 1335}_u, +, 1}_v
1831
1832    FORNOW: This is a specialized implementation for a case occurring in
1833    a common benchmark.  Implement the general algorithm.  */
1834
1835 static void
1836 compute_overlap_steps_for_affine_1_2 (tree chrec_a, tree chrec_b,
1837                                       conflict_function **overlaps_a,
1838                                       conflict_function **overlaps_b,
1839                                       tree *last_conflicts)
1840 {
1841   bool xz_p, yz_p, xyz_p;
1842   int step_x, step_y, step_z;
1843   HOST_WIDE_INT niter_x, niter_y, niter_z, niter;
1844   affine_fn overlaps_a_xz, overlaps_b_xz;
1845   affine_fn overlaps_a_yz, overlaps_b_yz;
1846   affine_fn overlaps_a_xyz, overlaps_b_xyz;
1847   affine_fn ova1, ova2, ovb;
1848   tree last_conflicts_xz, last_conflicts_yz, last_conflicts_xyz;
1849
1850   step_x = int_cst_value (CHREC_RIGHT (CHREC_LEFT (chrec_a)));
1851   step_y = int_cst_value (CHREC_RIGHT (chrec_a));
1852   step_z = int_cst_value (CHREC_RIGHT (chrec_b));
1853
1854   niter_x = estimated_loop_iterations_int
1855                 (get_chrec_loop (CHREC_LEFT (chrec_a)), true);
1856   niter_y = estimated_loop_iterations_int (get_chrec_loop (chrec_a), true);
1857   niter_z = estimated_loop_iterations_int (get_chrec_loop (chrec_b), true);
1858
1859   if (niter_x < 0 || niter_y < 0 || niter_z < 0)
1860     {
1861       if (dump_file && (dump_flags & TDF_DETAILS))
1862         fprintf (dump_file, "overlap steps test failed: no iteration counts.\n");
1863
1864       *overlaps_a = conflict_fn_not_known ();
1865       *overlaps_b = conflict_fn_not_known ();
1866       *last_conflicts = chrec_dont_know;
1867       return;
1868     }
1869
1870   niter = MIN (niter_x, niter_z);
1871   compute_overlap_steps_for_affine_univar (niter, step_x, step_z,
1872                                            &overlaps_a_xz,
1873                                            &overlaps_b_xz,
1874                                            &last_conflicts_xz, 1);
1875   niter = MIN (niter_y, niter_z);
1876   compute_overlap_steps_for_affine_univar (niter, step_y, step_z,
1877                                            &overlaps_a_yz,
1878                                            &overlaps_b_yz,
1879                                            &last_conflicts_yz, 2);
1880   niter = MIN (niter_x, niter_z);
1881   niter = MIN (niter_y, niter);
1882   compute_overlap_steps_for_affine_univar (niter, step_x + step_y, step_z,
1883                                            &overlaps_a_xyz,
1884                                            &overlaps_b_xyz,
1885                                            &last_conflicts_xyz, 3);
1886
1887   xz_p = !integer_zerop (last_conflicts_xz);
1888   yz_p = !integer_zerop (last_conflicts_yz);
1889   xyz_p = !integer_zerop (last_conflicts_xyz);
1890
1891   if (xz_p || yz_p || xyz_p)
1892     {
1893       ova1 = affine_fn_cst (integer_zero_node);
1894       ova2 = affine_fn_cst (integer_zero_node);
1895       ovb = affine_fn_cst (integer_zero_node);
1896       if (xz_p)
1897         {
1898           affine_fn t0 = ova1;
1899           affine_fn t2 = ovb;
1900
1901           ova1 = affine_fn_plus (ova1, overlaps_a_xz);
1902           ovb = affine_fn_plus (ovb, overlaps_b_xz);
1903           affine_fn_free (t0);
1904           affine_fn_free (t2);
1905           *last_conflicts = last_conflicts_xz;
1906         }
1907       if (yz_p)
1908         {
1909           affine_fn t0 = ova2;
1910           affine_fn t2 = ovb;
1911
1912           ova2 = affine_fn_plus (ova2, overlaps_a_yz);
1913           ovb = affine_fn_plus (ovb, overlaps_b_yz);
1914           affine_fn_free (t0);
1915           affine_fn_free (t2);
1916           *last_conflicts = last_conflicts_yz;
1917         }
1918       if (xyz_p)
1919         {
1920           affine_fn t0 = ova1;
1921           affine_fn t2 = ova2;
1922           affine_fn t4 = ovb;
1923
1924           ova1 = affine_fn_plus (ova1, overlaps_a_xyz);
1925           ova2 = affine_fn_plus (ova2, overlaps_a_xyz);
1926           ovb = affine_fn_plus (ovb, overlaps_b_xyz);
1927           affine_fn_free (t0);
1928           affine_fn_free (t2);
1929           affine_fn_free (t4);
1930           *last_conflicts = last_conflicts_xyz;
1931         }
1932       *overlaps_a = conflict_fn (2, ova1, ova2);
1933       *overlaps_b = conflict_fn (1, ovb);
1934     }
1935   else
1936     {
1937       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1938       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1939       *last_conflicts = integer_zero_node;
1940     }
1941
1942   affine_fn_free (overlaps_a_xz);
1943   affine_fn_free (overlaps_b_xz);
1944   affine_fn_free (overlaps_a_yz);
1945   affine_fn_free (overlaps_b_yz);
1946   affine_fn_free (overlaps_a_xyz);
1947   affine_fn_free (overlaps_b_xyz);
1948 }
1949
1950 /* Determines the overlapping elements due to accesses CHREC_A and
1951    CHREC_B, that are affine functions.  This function cannot handle
1952    symbolic evolution functions, ie. when initial conditions are
1953    parameters, because it uses lambda matrices of integers.  */
1954
1955 static void
1956 analyze_subscript_affine_affine (tree chrec_a,
1957                                  tree chrec_b,
1958                                  conflict_function **overlaps_a,
1959                                  conflict_function **overlaps_b,
1960                                  tree *last_conflicts)
1961 {
1962   unsigned nb_vars_a, nb_vars_b, dim;
1963   int init_a, init_b, gamma, gcd_alpha_beta;
1964   int tau1, tau2;
1965   lambda_matrix A, U, S;
1966
1967   if (eq_evolutions_p (chrec_a, chrec_b))
1968     {
1969       /* The accessed index overlaps for each iteration in the
1970          loop.  */
1971       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
1972       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
1973       *last_conflicts = chrec_dont_know;
1974       return;
1975     }
1976   if (dump_file && (dump_flags & TDF_DETAILS))
1977     fprintf (dump_file, "(analyze_subscript_affine_affine \n");
1978
1979   /* For determining the initial intersection, we have to solve a
1980      Diophantine equation.  This is the most time consuming part.
1981
1982      For answering to the question: "Is there a dependence?" we have
1983      to prove that there exists a solution to the Diophantine
1984      equation, and that the solution is in the iteration domain,
1985      i.e. the solution is positive or zero, and that the solution
1986      happens before the upper bound loop.nb_iterations.  Otherwise
1987      there is no dependence.  This function outputs a description of
1988      the iterations that hold the intersections.  */
1989
1990   nb_vars_a = nb_vars_in_chrec (chrec_a);
1991   nb_vars_b = nb_vars_in_chrec (chrec_b);
1992
1993   dim = nb_vars_a + nb_vars_b;
1994   U = lambda_matrix_new (dim, dim);
1995   A = lambda_matrix_new (dim, 1);
1996   S = lambda_matrix_new (dim, 1);
1997
1998   init_a = initialize_matrix_A (A, chrec_a, 0, 1);
1999   init_b = initialize_matrix_A (A, chrec_b, nb_vars_a, -1);
2000   gamma = init_b - init_a;
2001
2002   /* Don't do all the hard work of solving the Diophantine equation
2003      when we already know the solution: for example,
2004      | {3, +, 1}_1
2005      | {3, +, 4}_2
2006      | gamma = 3 - 3 = 0.
2007      Then the first overlap occurs during the first iterations:
2008      | {3, +, 1}_1 ({0, +, 4}_x) = {3, +, 4}_2 ({0, +, 1}_x)
2009   */
2010   if (gamma == 0)
2011     {
2012       if (nb_vars_a == 1 && nb_vars_b == 1)
2013         {
2014           int step_a, step_b;
2015           HOST_WIDE_INT niter, niter_a, niter_b;
2016           affine_fn ova, ovb;
2017
2018           niter_a = estimated_loop_iterations_int
2019                         (get_chrec_loop (chrec_a), true);
2020           niter_b = estimated_loop_iterations_int
2021                         (get_chrec_loop (chrec_b), true);
2022           if (niter_a < 0 || niter_b < 0)
2023             {
2024               if (dump_file && (dump_flags & TDF_DETAILS))
2025                 fprintf (dump_file, "affine-affine test failed: missing iteration counts.\n");
2026               *overlaps_a = conflict_fn_not_known ();
2027               *overlaps_b = conflict_fn_not_known ();
2028               *last_conflicts = chrec_dont_know;
2029               goto end_analyze_subs_aa;
2030             }
2031
2032           niter = MIN (niter_a, niter_b);
2033
2034           step_a = int_cst_value (CHREC_RIGHT (chrec_a));
2035           step_b = int_cst_value (CHREC_RIGHT (chrec_b));
2036
2037           compute_overlap_steps_for_affine_univar (niter, step_a, step_b,
2038                                                    &ova, &ovb,
2039                                                    last_conflicts, 1);
2040           *overlaps_a = conflict_fn (1, ova);
2041           *overlaps_b = conflict_fn (1, ovb);
2042         }
2043
2044       else if (nb_vars_a == 2 && nb_vars_b == 1)
2045         compute_overlap_steps_for_affine_1_2
2046           (chrec_a, chrec_b, overlaps_a, overlaps_b, last_conflicts);
2047
2048       else if (nb_vars_a == 1 && nb_vars_b == 2)
2049         compute_overlap_steps_for_affine_1_2
2050           (chrec_b, chrec_a, overlaps_b, overlaps_a, last_conflicts);
2051
2052       else
2053         {
2054           if (dump_file && (dump_flags & TDF_DETAILS))
2055             fprintf (dump_file, "affine-affine test failed: too many variables.\n");
2056           *overlaps_a = conflict_fn_not_known ();
2057           *overlaps_b = conflict_fn_not_known ();
2058           *last_conflicts = chrec_dont_know;
2059         }
2060       goto end_analyze_subs_aa;
2061     }
2062
2063   /* U.A = S */
2064   lambda_matrix_right_hermite (A, dim, 1, S, U);
2065
2066   if (S[0][0] < 0)
2067     {
2068       S[0][0] *= -1;
2069       lambda_matrix_row_negate (U, dim, 0);
2070     }
2071   gcd_alpha_beta = S[0][0];
2072
2073   /* Something went wrong: for example in {1, +, 0}_5 vs. {0, +, 0}_5,
2074      but that is a quite strange case.  Instead of ICEing, answer
2075      don't know.  */
2076   if (gcd_alpha_beta == 0)
2077     {
2078       *overlaps_a = conflict_fn_not_known ();
2079       *overlaps_b = conflict_fn_not_known ();
2080       *last_conflicts = chrec_dont_know;
2081       goto end_analyze_subs_aa;
2082     }
2083
2084   /* The classic "gcd-test".  */
2085   if (!int_divides_p (gcd_alpha_beta, gamma))
2086     {
2087       /* The "gcd-test" has determined that there is no integer
2088          solution, i.e. there is no dependence.  */
2089       *overlaps_a = conflict_fn_no_dependence ();
2090       *overlaps_b = conflict_fn_no_dependence ();
2091       *last_conflicts = integer_zero_node;
2092     }
2093
2094   /* Both access functions are univariate.  This includes SIV and MIV cases.  */
2095   else if (nb_vars_a == 1 && nb_vars_b == 1)
2096     {
2097       /* Both functions should have the same evolution sign.  */
2098       if (((A[0][0] > 0 && -A[1][0] > 0)
2099            || (A[0][0] < 0 && -A[1][0] < 0)))
2100         {
2101           /* The solutions are given by:
2102              |
2103              | [GAMMA/GCD_ALPHA_BETA  t].[u11 u12]  = [x0]
2104              |                           [u21 u22]    [y0]
2105
2106              For a given integer t.  Using the following variables,
2107
2108              | i0 = u11 * gamma / gcd_alpha_beta
2109              | j0 = u12 * gamma / gcd_alpha_beta
2110              | i1 = u21
2111              | j1 = u22
2112
2113              the solutions are:
2114
2115              | x0 = i0 + i1 * t,
2116              | y0 = j0 + j1 * t.  */
2117
2118           int i0, j0, i1, j1;
2119
2120           /* X0 and Y0 are the first iterations for which there is a
2121              dependence.  X0, Y0 are two solutions of the Diophantine
2122              equation: chrec_a (X0) = chrec_b (Y0).  */
2123           int x0, y0;
2124           int niter, niter_a, niter_b;
2125
2126           niter_a = estimated_loop_iterations_int
2127                         (get_chrec_loop (chrec_a), true);
2128           niter_b = estimated_loop_iterations_int
2129                         (get_chrec_loop (chrec_b), true);
2130
2131           if (niter_a < 0 || niter_b < 0)
2132             {
2133               if (dump_file && (dump_flags & TDF_DETAILS))
2134                 fprintf (dump_file, "affine-affine test failed: missing iteration counts.\n");
2135               *overlaps_a = conflict_fn_not_known ();
2136               *overlaps_b = conflict_fn_not_known ();
2137               *last_conflicts = chrec_dont_know;
2138               goto end_analyze_subs_aa;
2139             }
2140
2141           niter = MIN (niter_a, niter_b);
2142
2143           i0 = U[0][0] * gamma / gcd_alpha_beta;
2144           j0 = U[0][1] * gamma / gcd_alpha_beta;
2145           i1 = U[1][0];
2146           j1 = U[1][1];
2147
2148           if ((i1 == 0 && i0 < 0)
2149               || (j1 == 0 && j0 < 0))
2150             {
2151               /* There is no solution.
2152                  FIXME: The case "i0 > nb_iterations, j0 > nb_iterations"
2153                  falls in here, but for the moment we don't look at the
2154                  upper bound of the iteration domain.  */
2155               *overlaps_a = conflict_fn_no_dependence ();
2156               *overlaps_b = conflict_fn_no_dependence ();
2157               *last_conflicts = integer_zero_node;
2158             }
2159
2160           else
2161             {
2162               if (i1 > 0)
2163                 {
2164                   tau1 = CEIL (-i0, i1);
2165                   tau2 = FLOOR_DIV (niter - i0, i1);
2166
2167                   if (j1 > 0)
2168                     {
2169                       int last_conflict, min_multiple;
2170                       tau1 = MAX (tau1, CEIL (-j0, j1));
2171                       tau2 = MIN (tau2, FLOOR_DIV (niter - j0, j1));
2172
2173                       x0 = i1 * tau1 + i0;
2174                       y0 = j1 * tau1 + j0;
2175
2176                       /* At this point (x0, y0) is one of the
2177                          solutions to the Diophantine equation.  The
2178                          next step has to compute the smallest
2179                          positive solution: the first conflicts.  */
2180                       min_multiple = MIN (x0 / i1, y0 / j1);
2181                       x0 -= i1 * min_multiple;
2182                       y0 -= j1 * min_multiple;
2183
2184                       tau1 = (x0 - i0)/i1;
2185                       last_conflict = tau2 - tau1;
2186
2187                       /* If the overlap occurs outside of the bounds of the
2188                          loop, there is no dependence.  */
2189                       if (x0 > niter || y0  > niter)
2190                         {
2191                           *overlaps_a = conflict_fn_no_dependence ();
2192                           *overlaps_b = conflict_fn_no_dependence ();
2193                           *last_conflicts = integer_zero_node;
2194                         }
2195                       else
2196                         {
2197                           *overlaps_a
2198                             = conflict_fn (1,
2199                                 affine_fn_univar (build_int_cst (NULL_TREE, x0),
2200                                                   1,
2201                                                   build_int_cst (NULL_TREE, i1)));
2202                           *overlaps_b
2203                             = conflict_fn (1,
2204                                 affine_fn_univar (build_int_cst (NULL_TREE, y0),
2205                                                   1,
2206                                                   build_int_cst (NULL_TREE, j1)));
2207                           *last_conflicts = build_int_cst (NULL_TREE, last_conflict);
2208                         }
2209                     }
2210                   else
2211                     {
2212                       /* FIXME: For the moment, the upper bound of the
2213                          iteration domain for j is not checked.  */
2214                       if (dump_file && (dump_flags & TDF_DETAILS))
2215                         fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2216                       *overlaps_a = conflict_fn_not_known ();
2217                       *overlaps_b = conflict_fn_not_known ();
2218                       *last_conflicts = chrec_dont_know;
2219                     }
2220                 }
2221
2222               else
2223                 {
2224                   /* FIXME: For the moment, the upper bound of the
2225                      iteration domain for i is not checked.  */
2226                   if (dump_file && (dump_flags & TDF_DETAILS))
2227                     fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2228                   *overlaps_a = conflict_fn_not_known ();
2229                   *overlaps_b = conflict_fn_not_known ();
2230                   *last_conflicts = chrec_dont_know;
2231                 }
2232             }
2233         }
2234       else
2235         {
2236           if (dump_file && (dump_flags & TDF_DETAILS))
2237             fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2238           *overlaps_a = conflict_fn_not_known ();
2239           *overlaps_b = conflict_fn_not_known ();
2240           *last_conflicts = chrec_dont_know;
2241         }
2242     }
2243
2244   else
2245     {
2246       if (dump_file && (dump_flags & TDF_DETAILS))
2247         fprintf (dump_file, "affine-affine test failed: unimplemented.\n");
2248       *overlaps_a = conflict_fn_not_known ();
2249       *overlaps_b = conflict_fn_not_known ();
2250       *last_conflicts = chrec_dont_know;
2251     }
2252
2253 end_analyze_subs_aa:
2254   if (dump_file && (dump_flags & TDF_DETAILS))
2255     {
2256       fprintf (dump_file, "  (overlaps_a = ");
2257       dump_conflict_function (dump_file, *overlaps_a);
2258       fprintf (dump_file, ")\n  (overlaps_b = ");
2259       dump_conflict_function (dump_file, *overlaps_b);
2260       fprintf (dump_file, ")\n");
2261       fprintf (dump_file, ")\n");
2262     }
2263 }
2264
2265 /* Returns true when analyze_subscript_affine_affine can be used for
2266    determining the dependence relation between chrec_a and chrec_b,
2267    that contain symbols.  This function modifies chrec_a and chrec_b
2268    such that the analysis result is the same, and such that they don't
2269    contain symbols, and then can safely be passed to the analyzer.
2270
2271    Example: The analysis of the following tuples of evolutions produce
2272    the same results: {x+1, +, 1}_1 vs. {x+3, +, 1}_1, and {-2, +, 1}_1
2273    vs. {0, +, 1}_1
2274
2275    {x+1, +, 1}_1 ({2, +, 1}_1) = {x+3, +, 1}_1 ({0, +, 1}_1)
2276    {-2, +, 1}_1 ({2, +, 1}_1) = {0, +, 1}_1 ({0, +, 1}_1)
2277 */
2278
2279 static bool
2280 can_use_analyze_subscript_affine_affine (tree *chrec_a, tree *chrec_b)
2281 {
2282   tree diff, type, left_a, left_b, right_b;
2283
2284   if (chrec_contains_symbols (CHREC_RIGHT (*chrec_a))
2285       || chrec_contains_symbols (CHREC_RIGHT (*chrec_b)))
2286     /* FIXME: For the moment not handled.  Might be refined later.  */
2287     return false;
2288
2289   type = chrec_type (*chrec_a);
2290   left_a = CHREC_LEFT (*chrec_a);
2291   left_b = chrec_convert (type, CHREC_LEFT (*chrec_b), NULL_TREE);
2292   diff = chrec_fold_minus (type, left_a, left_b);
2293
2294   if (!evolution_function_is_constant_p (diff))
2295     return false;
2296
2297   if (dump_file && (dump_flags & TDF_DETAILS))
2298     fprintf (dump_file, "can_use_subscript_aff_aff_for_symbolic \n");
2299
2300   *chrec_a = build_polynomial_chrec (CHREC_VARIABLE (*chrec_a),
2301                                      diff, CHREC_RIGHT (*chrec_a));
2302   right_b = chrec_convert (type, CHREC_RIGHT (*chrec_b), NULL_TREE);
2303   *chrec_b = build_polynomial_chrec (CHREC_VARIABLE (*chrec_b),
2304                                      build_int_cst (type, 0),
2305                                      right_b);
2306   return true;
2307 }
2308
2309 /* Analyze a SIV (Single Index Variable) subscript.  *OVERLAPS_A and
2310    *OVERLAPS_B are initialized to the functions that describe the
2311    relation between the elements accessed twice by CHREC_A and
2312    CHREC_B.  For k >= 0, the following property is verified:
2313
2314    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
2315
2316 static void
2317 analyze_siv_subscript (tree chrec_a,
2318                        tree chrec_b,
2319                        conflict_function **overlaps_a,
2320                        conflict_function **overlaps_b,
2321                        tree *last_conflicts)
2322 {
2323   dependence_stats.num_siv++;
2324
2325   if (dump_file && (dump_flags & TDF_DETAILS))
2326     fprintf (dump_file, "(analyze_siv_subscript \n");
2327
2328   if (evolution_function_is_constant_p (chrec_a)
2329       && evolution_function_is_affine_p (chrec_b))
2330     analyze_siv_subscript_cst_affine (chrec_a, chrec_b,
2331                                       overlaps_a, overlaps_b, last_conflicts);
2332
2333   else if (evolution_function_is_affine_p (chrec_a)
2334            && evolution_function_is_constant_p (chrec_b))
2335     analyze_siv_subscript_cst_affine (chrec_b, chrec_a,
2336                                       overlaps_b, overlaps_a, last_conflicts);
2337
2338   else if (evolution_function_is_affine_p (chrec_a)
2339            && evolution_function_is_affine_p (chrec_b))
2340     {
2341       if (!chrec_contains_symbols (chrec_a)
2342           && !chrec_contains_symbols (chrec_b))
2343         {
2344           analyze_subscript_affine_affine (chrec_a, chrec_b,
2345                                            overlaps_a, overlaps_b,
2346                                            last_conflicts);
2347
2348           if (CF_NOT_KNOWN_P (*overlaps_a)
2349               || CF_NOT_KNOWN_P (*overlaps_b))
2350             dependence_stats.num_siv_unimplemented++;
2351           else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2352                    || CF_NO_DEPENDENCE_P (*overlaps_b))
2353             dependence_stats.num_siv_independent++;
2354           else
2355             dependence_stats.num_siv_dependent++;
2356         }
2357       else if (can_use_analyze_subscript_affine_affine (&chrec_a,
2358                                                         &chrec_b))
2359         {
2360           analyze_subscript_affine_affine (chrec_a, chrec_b,
2361                                            overlaps_a, overlaps_b,
2362                                            last_conflicts);
2363           /* FIXME: The number of iterations is a symbolic expression.
2364              Compute it properly.  */
2365           *last_conflicts = chrec_dont_know;
2366
2367           if (CF_NOT_KNOWN_P (*overlaps_a)
2368               || CF_NOT_KNOWN_P (*overlaps_b))
2369             dependence_stats.num_siv_unimplemented++;
2370           else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2371                    || CF_NO_DEPENDENCE_P (*overlaps_b))
2372             dependence_stats.num_siv_independent++;
2373           else
2374             dependence_stats.num_siv_dependent++;
2375         }
2376       else
2377         goto siv_subscript_dontknow;
2378     }
2379
2380   else
2381     {
2382     siv_subscript_dontknow:;
2383       if (dump_file && (dump_flags & TDF_DETAILS))
2384         fprintf (dump_file, "siv test failed: unimplemented.\n");
2385       *overlaps_a = conflict_fn_not_known ();
2386       *overlaps_b = conflict_fn_not_known ();
2387       *last_conflicts = chrec_dont_know;
2388       dependence_stats.num_siv_unimplemented++;
2389     }
2390
2391   if (dump_file && (dump_flags & TDF_DETAILS))
2392     fprintf (dump_file, ")\n");
2393 }
2394
2395 /* Returns false if we can prove that the greatest common divisor of the steps
2396    of CHREC does not divide CST, false otherwise.  */
2397
2398 static bool
2399 gcd_of_steps_may_divide_p (tree chrec, tree cst)
2400 {
2401   HOST_WIDE_INT cd = 0, val;
2402   tree step;
2403
2404   if (!host_integerp (cst, 0))
2405     return true;
2406   val = tree_low_cst (cst, 0);
2407
2408   while (TREE_CODE (chrec) == POLYNOMIAL_CHREC)
2409     {
2410       step = CHREC_RIGHT (chrec);
2411       if (!host_integerp (step, 0))
2412         return true;
2413       cd = gcd (cd, tree_low_cst (step, 0));
2414       chrec = CHREC_LEFT (chrec);
2415     }
2416
2417   return val % cd == 0;
2418 }
2419
2420 /* Analyze a MIV (Multiple Index Variable) subscript.  *OVERLAPS_A and
2421    *OVERLAPS_B are initialized to the functions that describe the
2422    relation between the elements accessed twice by CHREC_A and
2423    CHREC_B.  For k >= 0, the following property is verified:
2424
2425    CHREC_A (*OVERLAPS_A (k)) = CHREC_B (*OVERLAPS_B (k)).  */
2426
2427 static void
2428 analyze_miv_subscript (tree chrec_a,
2429                        tree chrec_b,
2430                        conflict_function **overlaps_a,
2431                        conflict_function **overlaps_b,
2432                        tree *last_conflicts)
2433 {
2434   /* FIXME:  This is a MIV subscript, not yet handled.
2435      Example: (A[{1, +, 1}_1] vs. A[{1, +, 1}_2]) that comes from
2436      (A[i] vs. A[j]).
2437
2438      In the SIV test we had to solve a Diophantine equation with two
2439      variables.  In the MIV case we have to solve a Diophantine
2440      equation with 2*n variables (if the subscript uses n IVs).
2441   */
2442   tree difference;
2443   dependence_stats.num_miv++;
2444   if (dump_file && (dump_flags & TDF_DETAILS))
2445     fprintf (dump_file, "(analyze_miv_subscript \n");
2446
2447   chrec_a = chrec_convert (integer_type_node, chrec_a, NULL_TREE);
2448   chrec_b = chrec_convert (integer_type_node, chrec_b, NULL_TREE);
2449   difference = chrec_fold_minus (integer_type_node, chrec_a, chrec_b);
2450
2451   if (eq_evolutions_p (chrec_a, chrec_b))
2452     {
2453       /* Access functions are the same: all the elements are accessed
2454          in the same order.  */
2455       *overlaps_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2456       *overlaps_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2457       *last_conflicts = estimated_loop_iterations_tree
2458                                 (get_chrec_loop (chrec_a), true);
2459       dependence_stats.num_miv_dependent++;
2460     }
2461
2462   else if (evolution_function_is_constant_p (difference)
2463            /* For the moment, the following is verified:
2464               evolution_function_is_affine_multivariate_p (chrec_a, 0) */
2465            && !gcd_of_steps_may_divide_p (chrec_a, difference))
2466     {
2467       /* testsuite/.../ssa-chrec-33.c
2468          {{21, +, 2}_1, +, -2}_2  vs.  {{20, +, 2}_1, +, -2}_2
2469
2470          The difference is 1, and all the evolution steps are multiples
2471          of 2, consequently there are no overlapping elements.  */
2472       *overlaps_a = conflict_fn_no_dependence ();
2473       *overlaps_b = conflict_fn_no_dependence ();
2474       *last_conflicts = integer_zero_node;
2475       dependence_stats.num_miv_independent++;
2476     }
2477
2478   else if (evolution_function_is_affine_multivariate_p (chrec_a, 0)
2479            && !chrec_contains_symbols (chrec_a)
2480            && evolution_function_is_affine_multivariate_p (chrec_b, 0)
2481            && !chrec_contains_symbols (chrec_b))
2482     {
2483       /* testsuite/.../ssa-chrec-35.c
2484          {0, +, 1}_2  vs.  {0, +, 1}_3
2485          the overlapping elements are respectively located at iterations:
2486          {0, +, 1}_x and {0, +, 1}_x,
2487          in other words, we have the equality:
2488          {0, +, 1}_2 ({0, +, 1}_x) = {0, +, 1}_3 ({0, +, 1}_x)
2489
2490          Other examples:
2491          {{0, +, 1}_1, +, 2}_2 ({0, +, 1}_x, {0, +, 1}_y) =
2492          {0, +, 1}_1 ({{0, +, 1}_x, +, 2}_y)
2493
2494          {{0, +, 2}_1, +, 3}_2 ({0, +, 1}_y, {0, +, 1}_x) =
2495          {{0, +, 3}_1, +, 2}_2 ({0, +, 1}_x, {0, +, 1}_y)
2496       */
2497       analyze_subscript_affine_affine (chrec_a, chrec_b,
2498                                        overlaps_a, overlaps_b, last_conflicts);
2499
2500       if (CF_NOT_KNOWN_P (*overlaps_a)
2501           || CF_NOT_KNOWN_P (*overlaps_b))
2502         dependence_stats.num_miv_unimplemented++;
2503       else if (CF_NO_DEPENDENCE_P (*overlaps_a)
2504                || CF_NO_DEPENDENCE_P (*overlaps_b))
2505         dependence_stats.num_miv_independent++;
2506       else
2507         dependence_stats.num_miv_dependent++;
2508     }
2509
2510   else
2511     {
2512       /* When the analysis is too difficult, answer "don't know".  */
2513       if (dump_file && (dump_flags & TDF_DETAILS))
2514         fprintf (dump_file, "analyze_miv_subscript test failed: unimplemented.\n");
2515
2516       *overlaps_a = conflict_fn_not_known ();
2517       *overlaps_b = conflict_fn_not_known ();
2518       *last_conflicts = chrec_dont_know;
2519       dependence_stats.num_miv_unimplemented++;
2520     }
2521
2522   if (dump_file && (dump_flags & TDF_DETAILS))
2523     fprintf (dump_file, ")\n");
2524 }
2525
2526 /* Determines the iterations for which CHREC_A is equal to CHREC_B.
2527    OVERLAP_ITERATIONS_A and OVERLAP_ITERATIONS_B are initialized with
2528    two functions that describe the iterations that contain conflicting
2529    elements.
2530
2531    Remark: For an integer k >= 0, the following equality is true:
2532
2533    CHREC_A (OVERLAP_ITERATIONS_A (k)) == CHREC_B (OVERLAP_ITERATIONS_B (k)).
2534 */
2535
2536 static void
2537 analyze_overlapping_iterations (tree chrec_a,
2538                                 tree chrec_b,
2539                                 conflict_function **overlap_iterations_a,
2540                                 conflict_function **overlap_iterations_b,
2541                                 tree *last_conflicts)
2542 {
2543   dependence_stats.num_subscript_tests++;
2544
2545   if (dump_file && (dump_flags & TDF_DETAILS))
2546     {
2547       fprintf (dump_file, "(analyze_overlapping_iterations \n");
2548       fprintf (dump_file, "  (chrec_a = ");
2549       print_generic_expr (dump_file, chrec_a, 0);
2550       fprintf (dump_file, ")\n  (chrec_b = ");
2551       print_generic_expr (dump_file, chrec_b, 0);
2552       fprintf (dump_file, ")\n");
2553     }
2554
2555   if (chrec_a == NULL_TREE
2556       || chrec_b == NULL_TREE
2557       || chrec_contains_undetermined (chrec_a)
2558       || chrec_contains_undetermined (chrec_b))
2559     {
2560       dependence_stats.num_subscript_undetermined++;
2561
2562       *overlap_iterations_a = conflict_fn_not_known ();
2563       *overlap_iterations_b = conflict_fn_not_known ();
2564     }
2565
2566   /* If they are the same chrec, and are affine, they overlap
2567      on every iteration.  */
2568   else if (eq_evolutions_p (chrec_a, chrec_b)
2569            && evolution_function_is_affine_multivariate_p (chrec_a, 0))
2570     {
2571       dependence_stats.num_same_subscript_function++;
2572       *overlap_iterations_a = conflict_fn (1, affine_fn_cst (integer_zero_node));
2573       *overlap_iterations_b = conflict_fn (1, affine_fn_cst (integer_zero_node));
2574       *last_conflicts = chrec_dont_know;
2575     }
2576
2577   /* If they aren't the same, and aren't affine, we can't do anything
2578      yet. */
2579   else if ((chrec_contains_symbols (chrec_a)
2580             || chrec_contains_symbols (chrec_b))
2581            && (!evolution_function_is_affine_multivariate_p (chrec_a, 0)
2582                || !evolution_function_is_affine_multivariate_p (chrec_b, 0)))
2583     {
2584       dependence_stats.num_subscript_undetermined++;
2585       *overlap_iterations_a = conflict_fn_not_known ();
2586       *overlap_iterations_b = conflict_fn_not_known ();
2587     }
2588
2589   else if (ziv_subscript_p (chrec_a, chrec_b))
2590     analyze_ziv_subscript (chrec_a, chrec_b,
2591                            overlap_iterations_a, overlap_iterations_b,
2592                            last_conflicts);
2593
2594   else if (siv_subscript_p (chrec_a, chrec_b))
2595     analyze_siv_subscript (chrec_a, chrec_b,
2596                            overlap_iterations_a, overlap_iterations_b,
2597                            last_conflicts);
2598
2599   else
2600     analyze_miv_subscript (chrec_a, chrec_b,
2601                            overlap_iterations_a, overlap_iterations_b,
2602                            last_conflicts);
2603
2604   if (dump_file && (dump_flags & TDF_DETAILS))
2605     {
2606       fprintf (dump_file, "  (overlap_iterations_a = ");
2607       dump_conflict_function (dump_file, *overlap_iterations_a);
2608       fprintf (dump_file, ")\n  (overlap_iterations_b = ");
2609       dump_conflict_function (dump_file, *overlap_iterations_b);
2610       fprintf (dump_file, ")\n");
2611       fprintf (dump_file, ")\n");
2612     }
2613 }
2614
2615 /* Helper function for uniquely inserting distance vectors.  */
2616
2617 static void
2618 save_dist_v (struct data_dependence_relation *ddr, lambda_vector dist_v)
2619 {
2620   unsigned i;
2621   lambda_vector v;
2622
2623   for (i = 0; VEC_iterate (lambda_vector, DDR_DIST_VECTS (ddr), i, v); i++)
2624     if (lambda_vector_equal (v, dist_v, DDR_NB_LOOPS (ddr)))
2625       return;
2626
2627   VEC_safe_push (lambda_vector, heap, DDR_DIST_VECTS (ddr), dist_v);
2628 }
2629
2630 /* Helper function for uniquely inserting direction vectors.  */
2631
2632 static void
2633 save_dir_v (struct data_dependence_relation *ddr, lambda_vector dir_v)
2634 {
2635   unsigned i;
2636   lambda_vector v;
2637
2638   for (i = 0; VEC_iterate (lambda_vector, DDR_DIR_VECTS (ddr), i, v); i++)
2639     if (lambda_vector_equal (v, dir_v, DDR_NB_LOOPS (ddr)))
2640       return;
2641
2642   VEC_safe_push (lambda_vector, heap, DDR_DIR_VECTS (ddr), dir_v);
2643 }
2644
2645 /* Add a distance of 1 on all the loops outer than INDEX.  If we
2646    haven't yet determined a distance for this outer loop, push a new
2647    distance vector composed of the previous distance, and a distance
2648    of 1 for this outer loop.  Example:
2649
2650    | loop_1
2651    |   loop_2
2652    |     A[10]
2653    |   endloop_2
2654    | endloop_1
2655
2656    Saved vectors are of the form (dist_in_1, dist_in_2).  First, we
2657    save (0, 1), then we have to save (1, 0).  */
2658
2659 static void
2660 add_outer_distances (struct data_dependence_relation *ddr,
2661                      lambda_vector dist_v, int index)
2662 {
2663   /* For each outer loop where init_v is not set, the accesses are
2664      in dependence of distance 1 in the loop.  */
2665   while (--index >= 0)
2666     {
2667       lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2668       lambda_vector_copy (dist_v, save_v, DDR_NB_LOOPS (ddr));
2669       save_v[index] = 1;
2670       save_dist_v (ddr, save_v);
2671     }
2672 }
2673
2674 /* Return false when fail to represent the data dependence as a
2675    distance vector.  INIT_B is set to true when a component has been
2676    added to the distance vector DIST_V.  INDEX_CARRY is then set to
2677    the index in DIST_V that carries the dependence.  */
2678
2679 static bool
2680 build_classic_dist_vector_1 (struct data_dependence_relation *ddr,
2681                              struct data_reference *ddr_a,
2682                              struct data_reference *ddr_b,
2683                              lambda_vector dist_v, bool *init_b,
2684                              int *index_carry)
2685 {
2686   unsigned i;
2687   lambda_vector init_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2688
2689   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
2690     {
2691       tree access_fn_a, access_fn_b;
2692       struct subscript *subscript = DDR_SUBSCRIPT (ddr, i);
2693
2694       if (chrec_contains_undetermined (SUB_DISTANCE (subscript)))
2695         {
2696           non_affine_dependence_relation (ddr);
2697           return false;
2698         }
2699
2700       access_fn_a = DR_ACCESS_FN (ddr_a, i);
2701       access_fn_b = DR_ACCESS_FN (ddr_b, i);
2702
2703       if (TREE_CODE (access_fn_a) == POLYNOMIAL_CHREC
2704           && TREE_CODE (access_fn_b) == POLYNOMIAL_CHREC)
2705         {
2706           int dist, index;
2707           int index_a = index_in_loop_nest (CHREC_VARIABLE (access_fn_a),
2708                                             DDR_LOOP_NEST (ddr));
2709           int index_b = index_in_loop_nest (CHREC_VARIABLE (access_fn_b),
2710                                             DDR_LOOP_NEST (ddr));
2711
2712           /* The dependence is carried by the outermost loop.  Example:
2713              | loop_1
2714              |   A[{4, +, 1}_1]
2715              |   loop_2
2716              |     A[{5, +, 1}_2]
2717              |   endloop_2
2718              | endloop_1
2719              In this case, the dependence is carried by loop_1.  */
2720           index = index_a < index_b ? index_a : index_b;
2721           *index_carry = MIN (index, *index_carry);
2722
2723           if (chrec_contains_undetermined (SUB_DISTANCE (subscript)))
2724             {
2725               non_affine_dependence_relation (ddr);
2726               return false;
2727             }
2728
2729           dist = int_cst_value (SUB_DISTANCE (subscript));
2730
2731           /* This is the subscript coupling test.  If we have already
2732              recorded a distance for this loop (a distance coming from
2733              another subscript), it should be the same.  For example,
2734              in the following code, there is no dependence:
2735
2736              | loop i = 0, N, 1
2737              |   T[i+1][i] = ...
2738              |   ... = T[i][i]
2739              | endloop
2740           */
2741           if (init_v[index] != 0 && dist_v[index] != dist)
2742             {
2743               finalize_ddr_dependent (ddr, chrec_known);
2744               return false;
2745             }
2746
2747           dist_v[index] = dist;
2748           init_v[index] = 1;
2749           *init_b = true;
2750         }
2751       else if (!operand_equal_p (access_fn_a, access_fn_b, 0))
2752         {
2753           /* This can be for example an affine vs. constant dependence
2754              (T[i] vs. T[3]) that is not an affine dependence and is
2755              not representable as a distance vector.  */
2756           non_affine_dependence_relation (ddr);
2757           return false;
2758         }
2759     }
2760
2761   return true;
2762 }
2763
2764 /* Return true when the DDR contains two data references that have the
2765    same access functions.  */
2766
2767 static bool
2768 same_access_functions (struct data_dependence_relation *ddr)
2769 {
2770   unsigned i;
2771
2772   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
2773     if (!eq_evolutions_p (DR_ACCESS_FN (DDR_A (ddr), i),
2774                           DR_ACCESS_FN (DDR_B (ddr), i)))
2775       return false;
2776
2777   return true;
2778 }
2779
2780 /* Return true when the DDR contains only constant access functions.  */
2781
2782 static bool
2783 constant_access_functions (struct data_dependence_relation *ddr)
2784 {
2785   unsigned i;
2786
2787   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
2788     if (!evolution_function_is_constant_p (DR_ACCESS_FN (DDR_A (ddr), i))
2789         || !evolution_function_is_constant_p (DR_ACCESS_FN (DDR_B (ddr), i)))
2790       return false;
2791
2792   return true;
2793 }
2794
2795
2796 /* Helper function for the case where DDR_A and DDR_B are the same
2797    multivariate access function.  */
2798
2799 static void
2800 add_multivariate_self_dist (struct data_dependence_relation *ddr, tree c_2)
2801 {
2802   int x_1, x_2;
2803   tree c_1 = CHREC_LEFT (c_2);
2804   tree c_0 = CHREC_LEFT (c_1);
2805   lambda_vector dist_v;
2806   int v1, v2, cd;
2807
2808   /* Polynomials with more than 2 variables are not handled yet.  */
2809   if (TREE_CODE (c_0) != INTEGER_CST)
2810     {
2811       DDR_ARE_DEPENDENT (ddr) = chrec_dont_know;
2812       return;
2813     }
2814
2815   x_2 = index_in_loop_nest (CHREC_VARIABLE (c_2), DDR_LOOP_NEST (ddr));
2816   x_1 = index_in_loop_nest (CHREC_VARIABLE (c_1), DDR_LOOP_NEST (ddr));
2817
2818   /* For "{{0, +, 2}_1, +, 3}_2" the distance vector is (3, -2).  */
2819   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2820   v1 = int_cst_value (CHREC_RIGHT (c_1));
2821   v2 = int_cst_value (CHREC_RIGHT (c_2));
2822   cd = gcd (v1, v2);
2823   v1 /= cd;
2824   v2 /= cd;
2825
2826   if (v2 < 0)
2827     {
2828       v2 = -v2;
2829       v1 = -v1;
2830     }
2831
2832   dist_v[x_1] = v2;
2833   dist_v[x_2] = -v1;
2834   save_dist_v (ddr, dist_v);
2835
2836   add_outer_distances (ddr, dist_v, x_1);
2837 }
2838
2839 /* Helper function for the case where DDR_A and DDR_B are the same
2840    access functions.  */
2841
2842 static void
2843 add_other_self_distances (struct data_dependence_relation *ddr)
2844 {
2845   lambda_vector dist_v;
2846   unsigned i;
2847   int index_carry = DDR_NB_LOOPS (ddr);
2848
2849   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
2850     {
2851       tree access_fun = DR_ACCESS_FN (DDR_A (ddr), i);
2852
2853       if (TREE_CODE (access_fun) == POLYNOMIAL_CHREC)
2854         {
2855           if (!evolution_function_is_univariate_p (access_fun))
2856             {
2857               if (DDR_NUM_SUBSCRIPTS (ddr) != 1)
2858                 {
2859                   DDR_ARE_DEPENDENT (ddr) = chrec_dont_know;
2860                   return;
2861                 }
2862
2863               add_multivariate_self_dist (ddr, DR_ACCESS_FN (DDR_A (ddr), 0));
2864               return;
2865             }
2866
2867           index_carry = MIN (index_carry,
2868                              index_in_loop_nest (CHREC_VARIABLE (access_fun),
2869                                                  DDR_LOOP_NEST (ddr)));
2870         }
2871     }
2872
2873   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2874   add_outer_distances (ddr, dist_v, index_carry);
2875 }
2876
2877 static void
2878 insert_innermost_unit_dist_vector (struct data_dependence_relation *ddr)
2879 {
2880   lambda_vector dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2881
2882   dist_v[DDR_INNER_LOOP (ddr)] = 1;
2883   save_dist_v (ddr, dist_v);
2884 }
2885
2886 /* Adds a unit distance vector to DDR when there is a 0 overlap.  This
2887    is the case for example when access functions are the same and
2888    equal to a constant, as in:
2889
2890    | loop_1
2891    |   A[3] = ...
2892    |   ... = A[3]
2893    | endloop_1
2894
2895    in which case the distance vectors are (0) and (1).  */
2896
2897 static void
2898 add_distance_for_zero_overlaps (struct data_dependence_relation *ddr)
2899 {
2900   unsigned i, j;
2901
2902   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
2903     {
2904       subscript_p sub = DDR_SUBSCRIPT (ddr, i);
2905       conflict_function *ca = SUB_CONFLICTS_IN_A (sub);
2906       conflict_function *cb = SUB_CONFLICTS_IN_B (sub);
2907
2908       for (j = 0; j < ca->n; j++)
2909         if (affine_function_zero_p (ca->fns[j]))
2910           {
2911             insert_innermost_unit_dist_vector (ddr);
2912             return;
2913           }
2914
2915       for (j = 0; j < cb->n; j++)
2916         if (affine_function_zero_p (cb->fns[j]))
2917           {
2918             insert_innermost_unit_dist_vector (ddr);
2919             return;
2920           }
2921     }
2922 }
2923
2924 /* Compute the classic per loop distance vector.  DDR is the data
2925    dependence relation to build a vector from.  Return false when fail
2926    to represent the data dependence as a distance vector.  */
2927
2928 static bool
2929 build_classic_dist_vector (struct data_dependence_relation *ddr)
2930 {
2931   bool init_b = false;
2932   int index_carry = DDR_NB_LOOPS (ddr);
2933   lambda_vector dist_v;
2934
2935   if (DDR_ARE_DEPENDENT (ddr) != NULL_TREE)
2936     return true;
2937
2938   if (same_access_functions (ddr))
2939     {
2940       /* Save the 0 vector.  */
2941       dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2942       save_dist_v (ddr, dist_v);
2943
2944       if (constant_access_functions (ddr))
2945         add_distance_for_zero_overlaps (ddr);
2946
2947       if (DDR_NB_LOOPS (ddr) > 1)
2948         add_other_self_distances (ddr);
2949
2950       return true;
2951     }
2952
2953   dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2954   if (!build_classic_dist_vector_1 (ddr, DDR_A (ddr), DDR_B (ddr),
2955                                     dist_v, &init_b, &index_carry))
2956     return false;
2957
2958   /* Save the distance vector if we initialized one.  */
2959   if (init_b)
2960     {
2961       /* Verify a basic constraint: classic distance vectors should
2962          always be lexicographically positive.
2963
2964          Data references are collected in the order of execution of
2965          the program, thus for the following loop
2966
2967          | for (i = 1; i < 100; i++)
2968          |   for (j = 1; j < 100; j++)
2969          |     {
2970          |       t = T[j+1][i-1];  // A
2971          |       T[j][i] = t + 2;  // B
2972          |     }
2973
2974          references are collected following the direction of the wind:
2975          A then B.  The data dependence tests are performed also
2976          following this order, such that we're looking at the distance
2977          separating the elements accessed by A from the elements later
2978          accessed by B.  But in this example, the distance returned by
2979          test_dep (A, B) is lexicographically negative (-1, 1), that
2980          means that the access A occurs later than B with respect to
2981          the outer loop, ie. we're actually looking upwind.  In this
2982          case we solve test_dep (B, A) looking downwind to the
2983          lexicographically positive solution, that returns the
2984          distance vector (1, -1).  */
2985       if (!lambda_vector_lexico_pos (dist_v, DDR_NB_LOOPS (ddr)))
2986         {
2987           lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
2988           subscript_dependence_tester_1 (ddr, DDR_B (ddr), DDR_A (ddr));
2989           compute_subscript_distance (ddr);
2990           build_classic_dist_vector_1 (ddr, DDR_B (ddr), DDR_A (ddr),
2991                                        save_v, &init_b, &index_carry);
2992           save_dist_v (ddr, save_v);
2993
2994           /* In this case there is a dependence forward for all the
2995              outer loops:
2996
2997              | for (k = 1; k < 100; k++)
2998              |  for (i = 1; i < 100; i++)
2999              |   for (j = 1; j < 100; j++)
3000              |     {
3001              |       t = T[j+1][i-1];  // A
3002              |       T[j][i] = t + 2;  // B
3003              |     }
3004
3005              the vectors are:
3006              (0,  1, -1)
3007              (1,  1, -1)
3008              (1, -1,  1)
3009           */
3010           if (DDR_NB_LOOPS (ddr) > 1)
3011             {
3012               add_outer_distances (ddr, save_v, index_carry);
3013               add_outer_distances (ddr, dist_v, index_carry);
3014             }
3015         }
3016       else
3017         {
3018           lambda_vector save_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3019           lambda_vector_copy (dist_v, save_v, DDR_NB_LOOPS (ddr));
3020           save_dist_v (ddr, save_v);
3021
3022           if (DDR_NB_LOOPS (ddr) > 1)
3023             {
3024               lambda_vector opposite_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3025
3026               subscript_dependence_tester_1 (ddr, DDR_B (ddr), DDR_A (ddr));
3027               compute_subscript_distance (ddr);
3028               build_classic_dist_vector_1 (ddr, DDR_B (ddr), DDR_A (ddr),
3029                                            opposite_v, &init_b, &index_carry);
3030
3031               add_outer_distances (ddr, dist_v, index_carry);
3032               add_outer_distances (ddr, opposite_v, index_carry);
3033             }
3034         }
3035     }
3036   else
3037     {
3038       /* There is a distance of 1 on all the outer loops: Example:
3039          there is a dependence of distance 1 on loop_1 for the array A.
3040
3041          | loop_1
3042          |   A[5] = ...
3043          | endloop
3044       */
3045       add_outer_distances (ddr, dist_v,
3046                            lambda_vector_first_nz (dist_v,
3047                                                    DDR_NB_LOOPS (ddr), 0));
3048     }
3049
3050   if (dump_file && (dump_flags & TDF_DETAILS))
3051     {
3052       unsigned i;
3053
3054       fprintf (dump_file, "(build_classic_dist_vector\n");
3055       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
3056         {
3057           fprintf (dump_file, "  dist_vector = (");
3058           print_lambda_vector (dump_file, DDR_DIST_VECT (ddr, i),
3059                                DDR_NB_LOOPS (ddr));
3060           fprintf (dump_file, "  )\n");
3061         }
3062       fprintf (dump_file, ")\n");
3063     }
3064
3065   return true;
3066 }
3067
3068 /* Return the direction for a given distance.
3069    FIXME: Computing dir this way is suboptimal, since dir can catch
3070    cases that dist is unable to represent.  */
3071
3072 static inline enum data_dependence_direction
3073 dir_from_dist (int dist)
3074 {
3075   if (dist > 0)
3076     return dir_positive;
3077   else if (dist < 0)
3078     return dir_negative;
3079   else
3080     return dir_equal;
3081 }
3082
3083 /* Compute the classic per loop direction vector.  DDR is the data
3084    dependence relation to build a vector from.  */
3085
3086 static void
3087 build_classic_dir_vector (struct data_dependence_relation *ddr)
3088 {
3089   unsigned i, j;
3090   lambda_vector dist_v;
3091
3092   for (i = 0; VEC_iterate (lambda_vector, DDR_DIST_VECTS (ddr), i, dist_v); i++)
3093     {
3094       lambda_vector dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3095
3096       for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
3097         dir_v[j] = dir_from_dist (dist_v[j]);
3098
3099       save_dir_v (ddr, dir_v);
3100     }
3101 }
3102
3103 /* Helper function.  Returns true when there is a dependence between
3104    data references DRA and DRB.  */
3105
3106 static bool
3107 subscript_dependence_tester_1 (struct data_dependence_relation *ddr,
3108                                struct data_reference *dra,
3109                                struct data_reference *drb)
3110 {
3111   unsigned int i;
3112   tree last_conflicts;
3113   struct subscript *subscript;
3114
3115   for (i = 0; VEC_iterate (subscript_p, DDR_SUBSCRIPTS (ddr), i, subscript);
3116        i++)
3117     {
3118       conflict_function *overlaps_a, *overlaps_b;
3119
3120       analyze_overlapping_iterations (DR_ACCESS_FN (dra, i),
3121                                       DR_ACCESS_FN (drb, i),
3122                                       &overlaps_a, &overlaps_b,
3123                                       &last_conflicts);
3124
3125       if (CF_NOT_KNOWN_P (overlaps_a)
3126           || CF_NOT_KNOWN_P (overlaps_b))
3127         {
3128           finalize_ddr_dependent (ddr, chrec_dont_know);
3129           dependence_stats.num_dependence_undetermined++;
3130           free_conflict_function (overlaps_a);
3131           free_conflict_function (overlaps_b);
3132           return false;
3133         }
3134
3135       else if (CF_NO_DEPENDENCE_P (overlaps_a)
3136                || CF_NO_DEPENDENCE_P (overlaps_b))
3137         {
3138           finalize_ddr_dependent (ddr, chrec_known);
3139           dependence_stats.num_dependence_independent++;
3140           free_conflict_function (overlaps_a);
3141           free_conflict_function (overlaps_b);
3142           return false;
3143         }
3144
3145       else
3146         {
3147           SUB_CONFLICTS_IN_A (subscript) = overlaps_a;
3148           SUB_CONFLICTS_IN_B (subscript) = overlaps_b;
3149           SUB_LAST_CONFLICT (subscript) = last_conflicts;
3150         }
3151     }
3152
3153   return true;
3154 }
3155
3156 /* Computes the conflicting iterations, and initialize DDR.  */
3157
3158 static void
3159 subscript_dependence_tester (struct data_dependence_relation *ddr)
3160 {
3161
3162   if (dump_file && (dump_flags & TDF_DETAILS))
3163     fprintf (dump_file, "(subscript_dependence_tester \n");
3164
3165   if (subscript_dependence_tester_1 (ddr, DDR_A (ddr), DDR_B (ddr)))
3166     dependence_stats.num_dependence_dependent++;
3167
3168   compute_subscript_distance (ddr);
3169   if (build_classic_dist_vector (ddr))
3170     build_classic_dir_vector (ddr);
3171
3172   if (dump_file && (dump_flags & TDF_DETAILS))
3173     fprintf (dump_file, ")\n");
3174 }
3175
3176 /* Returns true when all the access functions of A are affine or
3177    constant.  */
3178
3179 static bool
3180 access_functions_are_affine_or_constant_p (struct data_reference *a)
3181 {
3182   unsigned int i;
3183   VEC(tree,heap) *fns = DR_ACCESS_FNS (a);
3184   tree t;
3185
3186   for (i = 0; VEC_iterate (tree, fns, i, t); i++)
3187     if (!evolution_function_is_constant_p (t)
3188         && !evolution_function_is_affine_multivariate_p (t, 0))
3189       return false;
3190
3191   return true;
3192 }
3193
3194 /* Initializes an equation for an OMEGA problem using the information
3195    contained in the ACCESS_FUN.  Returns true when the operation
3196    succeeded.
3197
3198    PB is the omega constraint system.
3199    EQ is the number of the equation to be initialized.
3200    OFFSET is used for shifting the variables names in the constraints:
3201    a constrain is composed of 2 * the number of variables surrounding
3202    dependence accesses.  OFFSET is set either to 0 for the first n variables,
3203    then it is set to n.
3204    ACCESS_FUN is expected to be an affine chrec.  */
3205
3206 static bool
3207 init_omega_eq_with_af (omega_pb pb, unsigned eq,
3208                        unsigned int offset, tree access_fun,
3209                        struct data_dependence_relation *ddr)
3210 {
3211   switch (TREE_CODE (access_fun))
3212     {
3213     case POLYNOMIAL_CHREC:
3214       {
3215         tree left = CHREC_LEFT (access_fun);
3216         tree right = CHREC_RIGHT (access_fun);
3217         int var = CHREC_VARIABLE (access_fun);
3218         unsigned var_idx;
3219
3220         if (TREE_CODE (right) != INTEGER_CST)
3221           return false;
3222
3223         var_idx = index_in_loop_nest (var, DDR_LOOP_NEST (ddr));
3224         pb->eqs[eq].coef[offset + var_idx + 1] = int_cst_value (right);
3225
3226         /* Compute the innermost loop index.  */
3227         DDR_INNER_LOOP (ddr) = MAX (DDR_INNER_LOOP (ddr), var_idx);
3228
3229         if (offset == 0)
3230           pb->eqs[eq].coef[var_idx + DDR_NB_LOOPS (ddr) + 1]
3231             += int_cst_value (right);
3232
3233         switch (TREE_CODE (left))
3234           {
3235           case POLYNOMIAL_CHREC:
3236             return init_omega_eq_with_af (pb, eq, offset, left, ddr);
3237
3238           case INTEGER_CST:
3239             pb->eqs[eq].coef[0] += int_cst_value (left);
3240             return true;
3241
3242           default:
3243             return false;
3244           }
3245       }
3246
3247     case INTEGER_CST:
3248       pb->eqs[eq].coef[0] += int_cst_value (access_fun);
3249       return true;
3250
3251     default:
3252       return false;
3253     }
3254 }
3255
3256 /* As explained in the comments preceding init_omega_for_ddr, we have
3257    to set up a system for each loop level, setting outer loops
3258    variation to zero, and current loop variation to positive or zero.
3259    Save each lexico positive distance vector.  */
3260
3261 static void
3262 omega_extract_distance_vectors (omega_pb pb,
3263                                 struct data_dependence_relation *ddr)
3264 {
3265   int eq, geq;
3266   unsigned i, j;
3267   struct loop *loopi, *loopj;
3268   enum omega_result res;
3269
3270   /* Set a new problem for each loop in the nest.  The basis is the
3271      problem that we have initialized until now.  On top of this we
3272      add new constraints.  */
3273   for (i = 0; i <= DDR_INNER_LOOP (ddr)
3274          && VEC_iterate (loop_p, DDR_LOOP_NEST (ddr), i, loopi); i++)
3275     {
3276       int dist = 0;
3277       omega_pb copy = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr),
3278                                            DDR_NB_LOOPS (ddr));
3279
3280       omega_copy_problem (copy, pb);
3281
3282       /* For all the outer loops "loop_j", add "dj = 0".  */
3283       for (j = 0;
3284            j < i && VEC_iterate (loop_p, DDR_LOOP_NEST (ddr), j, loopj); j++)
3285         {
3286           eq = omega_add_zero_eq (copy, omega_black);
3287           copy->eqs[eq].coef[j + 1] = 1;
3288         }
3289
3290       /* For "loop_i", add "0 <= di".  */
3291       geq = omega_add_zero_geq (copy, omega_black);
3292       copy->geqs[geq].coef[i + 1] = 1;
3293
3294       /* Reduce the constraint system, and test that the current
3295          problem is feasible.  */
3296       res = omega_simplify_problem (copy);
3297       if (res == omega_false
3298           || res == omega_unknown
3299           || copy->num_geqs > (int) DDR_NB_LOOPS (ddr))
3300         goto next_problem;
3301
3302       for (eq = 0; eq < copy->num_subs; eq++)
3303         if (copy->subs[eq].key == (int) i + 1)
3304           {
3305             dist = copy->subs[eq].coef[0];
3306             goto found_dist;
3307           }
3308
3309       if (dist == 0)
3310         {
3311           /* Reinitialize problem...  */
3312           omega_copy_problem (copy, pb);
3313           for (j = 0;
3314                j < i && VEC_iterate (loop_p, DDR_LOOP_NEST (ddr), j, loopj); j++)
3315             {
3316               eq = omega_add_zero_eq (copy, omega_black);
3317               copy->eqs[eq].coef[j + 1] = 1;
3318             }
3319
3320           /* ..., but this time "di = 1".  */
3321           eq = omega_add_zero_eq (copy, omega_black);
3322           copy->eqs[eq].coef[i + 1] = 1;
3323           copy->eqs[eq].coef[0] = -1;
3324
3325           res = omega_simplify_problem (copy);
3326           if (res == omega_false
3327               || res == omega_unknown
3328               || copy->num_geqs > (int) DDR_NB_LOOPS (ddr))
3329             goto next_problem;
3330
3331           for (eq = 0; eq < copy->num_subs; eq++)
3332             if (copy->subs[eq].key == (int) i + 1)
3333               {
3334                 dist = copy->subs[eq].coef[0];
3335                 goto found_dist;
3336               }
3337         }
3338
3339     found_dist:;
3340       /* Save the lexicographically positive distance vector.  */
3341       if (dist >= 0)
3342         {
3343           lambda_vector dist_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3344           lambda_vector dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3345
3346           dist_v[i] = dist;
3347
3348           for (eq = 0; eq < copy->num_subs; eq++)
3349             if (copy->subs[eq].key > 0)
3350               {
3351                 dist = copy->subs[eq].coef[0];
3352                 dist_v[copy->subs[eq].key - 1] = dist;
3353               }
3354
3355           for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
3356             dir_v[j] = dir_from_dist (dist_v[j]);
3357
3358           save_dist_v (ddr, dist_v);
3359           save_dir_v (ddr, dir_v);
3360         }
3361
3362     next_problem:;
3363       omega_free_problem (copy);
3364     }
3365 }
3366
3367 /* This is called for each subscript of a tuple of data references:
3368    insert an equality for representing the conflicts.  */
3369
3370 static bool
3371 omega_setup_subscript (tree access_fun_a, tree access_fun_b,
3372                        struct data_dependence_relation *ddr,
3373                        omega_pb pb, bool *maybe_dependent)
3374 {
3375   int eq;
3376   tree fun_a = chrec_convert (integer_type_node, access_fun_a, NULL_TREE);
3377   tree fun_b = chrec_convert (integer_type_node, access_fun_b, NULL_TREE);
3378   tree difference = chrec_fold_minus (integer_type_node, fun_a, fun_b);
3379
3380   /* When the fun_a - fun_b is not constant, the dependence is not
3381      captured by the classic distance vector representation.  */
3382   if (TREE_CODE (difference) != INTEGER_CST)
3383     return false;
3384
3385   /* ZIV test.  */
3386   if (ziv_subscript_p (fun_a, fun_b) && !integer_zerop (difference))
3387     {
3388       /* There is no dependence.  */
3389       *maybe_dependent = false;
3390       return true;
3391     }
3392
3393   fun_b = chrec_fold_multiply (integer_type_node, fun_b,
3394                                integer_minus_one_node);
3395
3396   eq = omega_add_zero_eq (pb, omega_black);
3397   if (!init_omega_eq_with_af (pb, eq, DDR_NB_LOOPS (ddr), fun_a, ddr)
3398       || !init_omega_eq_with_af (pb, eq, 0, fun_b, ddr))
3399     /* There is probably a dependence, but the system of
3400        constraints cannot be built: answer "don't know".  */
3401     return false;
3402
3403   /* GCD test.  */
3404   if (DDR_NB_LOOPS (ddr) != 0 && pb->eqs[eq].coef[0]
3405       && !int_divides_p (lambda_vector_gcd
3406                          ((lambda_vector) &(pb->eqs[eq].coef[1]),
3407                           2 * DDR_NB_LOOPS (ddr)),
3408                          pb->eqs[eq].coef[0]))
3409     {
3410       /* There is no dependence.  */
3411       *maybe_dependent = false;
3412       return true;
3413     }
3414
3415   return true;
3416 }
3417
3418 /* Helper function, same as init_omega_for_ddr but specialized for
3419    data references A and B.  */
3420
3421 static bool
3422 init_omega_for_ddr_1 (struct data_reference *dra, struct data_reference *drb,
3423                       struct data_dependence_relation *ddr,
3424                       omega_pb pb, bool *maybe_dependent)
3425 {
3426   unsigned i;
3427   int ineq;
3428   struct loop *loopi;
3429   unsigned nb_loops = DDR_NB_LOOPS (ddr);
3430
3431   /* Insert an equality per subscript.  */
3432   for (i = 0; i < DDR_NUM_SUBSCRIPTS (ddr); i++)
3433     {
3434       if (!omega_setup_subscript (DR_ACCESS_FN (dra, i), DR_ACCESS_FN (drb, i),
3435                                   ddr, pb, maybe_dependent))
3436         return false;
3437       else if (*maybe_dependent == false)
3438         {
3439           /* There is no dependence.  */
3440           DDR_ARE_DEPENDENT (ddr) = chrec_known;
3441           return true;
3442         }
3443     }
3444
3445   /* Insert inequalities: constraints corresponding to the iteration
3446      domain, i.e. the loops surrounding the references "loop_x" and
3447      the distance variables "dx".  The layout of the OMEGA
3448      representation is as follows:
3449      - coef[0] is the constant
3450      - coef[1..nb_loops] are the protected variables that will not be
3451      removed by the solver: the "dx"
3452      - coef[nb_loops + 1, 2*nb_loops] are the loop variables: "loop_x".
3453   */
3454   for (i = 0; i <= DDR_INNER_LOOP (ddr)
3455          && VEC_iterate (loop_p, DDR_LOOP_NEST (ddr), i, loopi); i++)
3456     {
3457       HOST_WIDE_INT nbi = estimated_loop_iterations_int (loopi, true);
3458
3459       /* 0 <= loop_x */
3460       ineq = omega_add_zero_geq (pb, omega_black);
3461       pb->geqs[ineq].coef[i + nb_loops + 1] = 1;
3462
3463       /* 0 <= loop_x + dx */
3464       ineq = omega_add_zero_geq (pb, omega_black);
3465       pb->geqs[ineq].coef[i + nb_loops + 1] = 1;
3466       pb->geqs[ineq].coef[i + 1] = 1;
3467
3468       if (nbi != -1)
3469         {
3470           /* loop_x <= nb_iters */
3471           ineq = omega_add_zero_geq (pb, omega_black);
3472           pb->geqs[ineq].coef[i + nb_loops + 1] = -1;
3473           pb->geqs[ineq].coef[0] = nbi;
3474
3475           /* loop_x + dx <= nb_iters */
3476           ineq = omega_add_zero_geq (pb, omega_black);
3477           pb->geqs[ineq].coef[i + nb_loops + 1] = -1;
3478           pb->geqs[ineq].coef[i + 1] = -1;
3479           pb->geqs[ineq].coef[0] = nbi;
3480
3481           /* A step "dx" bigger than nb_iters is not feasible, so
3482              add "0 <= nb_iters + dx",  */
3483           ineq = omega_add_zero_geq (pb, omega_black);
3484           pb->geqs[ineq].coef[i + 1] = 1;
3485           pb->geqs[ineq].coef[0] = nbi;
3486           /* and "dx <= nb_iters".  */
3487           ineq = omega_add_zero_geq (pb, omega_black);
3488           pb->geqs[ineq].coef[i + 1] = -1;
3489           pb->geqs[ineq].coef[0] = nbi;
3490         }
3491     }
3492
3493   omega_extract_distance_vectors (pb, ddr);
3494
3495   return true;
3496 }
3497
3498 /* Sets up the Omega dependence problem for the data dependence
3499    relation DDR.  Returns false when the constraint system cannot be
3500    built, ie. when the test answers "don't know".  Returns true
3501    otherwise, and when independence has been proved (using one of the
3502    trivial dependence test), set MAYBE_DEPENDENT to false, otherwise
3503    set MAYBE_DEPENDENT to true.
3504
3505    Example: for setting up the dependence system corresponding to the
3506    conflicting accesses
3507
3508    | loop_i
3509    |   loop_j
3510    |     A[i, i+1] = ...
3511    |     ... A[2*j, 2*(i + j)]
3512    |   endloop_j
3513    | endloop_i
3514
3515    the following constraints come from the iteration domain:
3516
3517    0 <= i <= Ni
3518    0 <= i + di <= Ni
3519    0 <= j <= Nj
3520    0 <= j + dj <= Nj
3521
3522    where di, dj are the distance variables.  The constraints
3523    representing the conflicting elements are:
3524
3525    i = 2 * (j + dj)
3526    i + 1 = 2 * (i + di + j + dj)
3527
3528    For asking that the resulting distance vector (di, dj) be
3529    lexicographically positive, we insert the constraint "di >= 0".  If
3530    "di = 0" in the solution, we fix that component to zero, and we
3531    look at the inner loops: we set a new problem where all the outer
3532    loop distances are zero, and fix this inner component to be
3533    positive.  When one of the components is positive, we save that
3534    distance, and set a new problem where the distance on this loop is
3535    zero, searching for other distances in the inner loops.  Here is
3536    the classic example that illustrates that we have to set for each
3537    inner loop a new problem:
3538
3539    | loop_1
3540    |   loop_2
3541    |     A[10]
3542    |   endloop_2
3543    | endloop_1
3544
3545    we have to save two distances (1, 0) and (0, 1).
3546
3547    Given two array references, refA and refB, we have to set the
3548    dependence problem twice, refA vs. refB and refB vs. refA, and we
3549    cannot do a single test, as refB might occur before refA in the
3550    inner loops, and the contrary when considering outer loops: ex.
3551
3552    | loop_0
3553    |   loop_1
3554    |     loop_2
3555    |       T[{1,+,1}_2][{1,+,1}_1]  // refA
3556    |       T[{2,+,1}_2][{0,+,1}_1]  // refB
3557    |     endloop_2
3558    |   endloop_1
3559    | endloop_0
3560
3561    refB touches the elements in T before refA, and thus for the same
3562    loop_0 refB precedes refA: ie. the distance vector (0, 1, -1)
3563    but for successive loop_0 iterations, we have (1, -1, 1)
3564
3565    The Omega solver expects the distance variables ("di" in the
3566    previous example) to come first in the constraint system (as
3567    variables to be protected, or "safe" variables), the constraint
3568    system is built using the following layout:
3569
3570    "cst | distance vars | index vars".
3571 */
3572
3573 static bool
3574 init_omega_for_ddr (struct data_dependence_relation *ddr,
3575                     bool *maybe_dependent)
3576 {
3577   omega_pb pb;
3578   bool res = false;
3579
3580   *maybe_dependent = true;
3581
3582   if (same_access_functions (ddr))
3583     {
3584       unsigned j;
3585       lambda_vector dir_v;
3586
3587       /* Save the 0 vector.  */
3588       save_dist_v (ddr, lambda_vector_new (DDR_NB_LOOPS (ddr)));
3589       dir_v = lambda_vector_new (DDR_NB_LOOPS (ddr));
3590       for (j = 0; j < DDR_NB_LOOPS (ddr); j++)
3591         dir_v[j] = dir_equal;
3592       save_dir_v (ddr, dir_v);
3593
3594       /* Save the dependences carried by outer loops.  */
3595       pb = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr), DDR_NB_LOOPS (ddr));
3596       res = init_omega_for_ddr_1 (DDR_A (ddr), DDR_B (ddr), ddr, pb,
3597                                   maybe_dependent);
3598       omega_free_problem (pb);
3599       return res;
3600     }
3601
3602   /* Omega expects the protected variables (those that have to be kept
3603      after elimination) to appear first in the constraint system.
3604      These variables are the distance variables.  In the following
3605      initialization we declare NB_LOOPS safe variables, and the total
3606      number of variables for the constraint system is 2*NB_LOOPS.  */
3607   pb = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr), DDR_NB_LOOPS (ddr));
3608   res = init_omega_for_ddr_1 (DDR_A (ddr), DDR_B (ddr), ddr, pb,
3609                               maybe_dependent);
3610   omega_free_problem (pb);
3611
3612   /* Stop computation if not decidable, or no dependence.  */
3613   if (res == false || *maybe_dependent == false)
3614     return res;
3615
3616   pb = omega_alloc_problem (2 * DDR_NB_LOOPS (ddr), DDR_NB_LOOPS (ddr));
3617   res = init_omega_for_ddr_1 (DDR_B (ddr), DDR_A (ddr), ddr, pb,
3618                               maybe_dependent);
3619   omega_free_problem (pb);
3620
3621   return res;
3622 }
3623
3624 /* Return true when DDR contains the same information as that stored
3625    in DIR_VECTS and in DIST_VECTS, return false otherwise.   */
3626
3627 static bool
3628 ddr_consistent_p (FILE *file,
3629                   struct data_dependence_relation *ddr,
3630                   VEC (lambda_vector, heap) *dist_vects,
3631                   VEC (lambda_vector, heap) *dir_vects)
3632 {
3633   unsigned int i, j;
3634
3635   /* If dump_file is set, output there.  */
3636   if (dump_file && (dump_flags & TDF_DETAILS))
3637     file = dump_file;
3638
3639   if (VEC_length (lambda_vector, dist_vects) != DDR_NUM_DIST_VECTS (ddr))
3640     {
3641       lambda_vector b_dist_v;
3642       fprintf (file, "\n(Number of distance vectors differ: Banerjee has %d, Omega has %d.\n",
3643                VEC_length (lambda_vector, dist_vects),
3644                DDR_NUM_DIST_VECTS (ddr));
3645
3646       fprintf (file, "Banerjee dist vectors:\n");
3647       for (i = 0; VEC_iterate (lambda_vector, dist_vects, i, b_dist_v); i++)
3648         print_lambda_vector (file, b_dist_v, DDR_NB_LOOPS (ddr));
3649
3650       fprintf (file, "Omega dist vectors:\n");
3651       for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
3652         print_lambda_vector (file, DDR_DIST_VECT (ddr, i), DDR_NB_LOOPS (ddr));
3653
3654       fprintf (file, "data dependence relation:\n");
3655       dump_data_dependence_relation (file, ddr);
3656
3657       fprintf (file, ")\n");
3658       return false;
3659     }
3660
3661   if (VEC_length (lambda_vector, dir_vects) != DDR_NUM_DIR_VECTS (ddr))
3662     {
3663       fprintf (file, "\n(Number of direction vectors differ: Banerjee has %d, Omega has %d.)\n",
3664                VEC_length (lambda_vector, dir_vects),
3665                DDR_NUM_DIR_VECTS (ddr));
3666       return false;
3667     }
3668
3669   for (i = 0; i < DDR_NUM_DIST_VECTS (ddr); i++)
3670     {
3671       lambda_vector a_dist_v;
3672       lambda_vector b_dist_v = DDR_DIST_VECT (ddr, i);
3673
3674       /* Distance vectors are not ordered in the same way in the DDR
3675          and in the DIST_VECTS: search for a matching vector.  */
3676       for (j = 0; VEC_iterate (lambda_vector, dist_vects, j, a_dist_v); j++)
3677         if (lambda_vector_equal (a_dist_v, b_dist_v, DDR_NB_LOOPS (ddr)))
3678           break;
3679
3680       if (j == VEC_length (lambda_vector, dist_vects))
3681         {
3682           fprintf (file, "\n(Dist vectors from the first dependence analyzer:\n");
3683           print_dist_vectors (file, dist_vects, DDR_NB_LOOPS (ddr));
3684           fprintf (file, "not found in Omega dist vectors:\n");
3685           print_dist_vectors (file, DDR_DIST_VECTS (ddr), DDR_NB_LOOPS (ddr));
3686           fprintf (file, "data dependence relation:\n");
3687           dump_data_dependence_relation (file, ddr);
3688           fprintf (file, ")\n");
3689         }
3690     }
3691
3692   for (i = 0; i < DDR_NUM_DIR_VECTS (ddr); i++)
3693     {
3694       lambda_vector a_dir_v;
3695       lambda_vector b_dir_v = DDR_DIR_VECT (ddr, i);
3696
3697       /* Direction vectors are not ordered in the same way in the DDR
3698          and in the DIR_VECTS: search for a matching vector.  */
3699       for (j = 0; VEC_iterate (lambda_vector, dir_vects, j, a_dir_v); j++)
3700         if (lambda_vector_equal (a_dir_v, b_dir_v, DDR_NB_LOOPS (ddr)))
3701           break;
3702
3703       if (j == VEC_length (lambda_vector, dist_vects))
3704         {
3705           fprintf (file, "\n(Dir vectors from the first dependence analyzer:\n");
3706           print_dir_vectors (file, dir_vects, DDR_NB_LOOPS (ddr));
3707           fprintf (file, "not found in Omega dir vectors:\n");
3708           print_dir_vectors (file, DDR_DIR_VECTS (ddr), DDR_NB_LOOPS (ddr));
3709           fprintf (file, "data dependence relation:\n");
3710           dump_data_dependence_relation (file, ddr);
3711           fprintf (file, ")\n");
3712         }
3713     }
3714
3715   return true;
3716 }
3717
3718 /* This computes the affine dependence relation between A and B.
3719    CHREC_KNOWN is used for representing the independence between two
3720    accesses, while CHREC_DONT_KNOW is used for representing the unknown
3721    relation.
3722
3723    Note that it is possible to stop the computation of the dependence
3724    relation the first time we detect a CHREC_KNOWN element for a given
3725    subscript.  */
3726
3727 static void
3728 compute_affine_dependence (struct data_dependence_relation *ddr)
3729 {
3730   struct data_reference *dra = DDR_A (ddr);
3731   struct data_reference *drb = DDR_B (ddr);
3732
3733   if (dump_file && (dump_flags & TDF_DETAILS))
3734     {
3735       fprintf (dump_file, "(compute_affine_dependence\n");
3736       fprintf (dump_file, "  (stmt_a = \n");
3737       print_generic_expr (dump_file, DR_STMT (dra), 0);
3738       fprintf (dump_file, ")\n  (stmt_b = \n");
3739       print_generic_expr (dump_file, DR_STMT (drb), 0);
3740       fprintf (dump_file, ")\n");
3741     }
3742
3743   /* Analyze only when the dependence relation is not yet known.  */
3744   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
3745     {
3746       dependence_stats.num_dependence_tests++;
3747
3748       if (access_functions_are_affine_or_constant_p (dra)
3749           && access_functions_are_affine_or_constant_p (drb))
3750         {
3751           if (flag_check_data_deps)
3752             {
3753               /* Compute the dependences using the first algorithm.  */
3754               subscript_dependence_tester (ddr);
3755
3756               if (dump_file && (dump_flags & TDF_DETAILS))
3757                 {
3758                   fprintf (dump_file, "\n\nBanerjee Analyzer\n");
3759                   dump_data_dependence_relation (dump_file, ddr);
3760                 }
3761
3762               if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE)
3763                 {
3764                   bool maybe_dependent;
3765                   VEC (lambda_vector, heap) *dir_vects, *dist_vects;
3766
3767                   /* Save the result of the first DD analyzer.  */
3768                   dist_vects = DDR_DIST_VECTS (ddr);
3769                   dir_vects = DDR_DIR_VECTS (ddr);
3770
3771                   /* Reset the information.  */
3772                   DDR_DIST_VECTS (ddr) = NULL;
3773                   DDR_DIR_VECTS (ddr) = NULL;
3774
3775                   /* Compute the same information using Omega.  */
3776                   if (!init_omega_for_ddr (ddr, &maybe_dependent))
3777                     goto csys_dont_know;
3778
3779                   if (dump_file && (dump_flags & TDF_DETAILS))
3780                     {
3781                       fprintf (dump_file, "Omega Analyzer\n");
3782                       dump_data_dependence_relation (dump_file, ddr);
3783                     }
3784
3785                   /* Check that we get the same information.  */
3786                   if (maybe_dependent)
3787                     gcc_assert (ddr_consistent_p (stderr, ddr, dist_vects,
3788                                                   dir_vects));
3789                 }
3790             }
3791           else
3792             subscript_dependence_tester (ddr);
3793         }
3794
3795       /* As a last case, if the dependence cannot be determined, or if
3796          the dependence is considered too difficult to determine, answer
3797          "don't know".  */
3798       else
3799         {
3800         csys_dont_know:;
3801           dependence_stats.num_dependence_undetermined++;
3802
3803           if (dump_file && (dump_flags & TDF_DETAILS))
3804             {
3805               fprintf (dump_file, "Data ref a:\n");
3806               dump_data_reference (dump_file, dra);
3807               fprintf (dump_file, "Data ref b:\n");
3808               dump_data_reference (dump_file, drb);
3809               fprintf (dump_file, "affine dependence test not usable: access function not affine or constant.\n");
3810             }
3811           finalize_ddr_dependent (ddr, chrec_dont_know);
3812         }
3813     }
3814
3815   if (dump_file && (dump_flags & TDF_DETAILS))
3816     fprintf (dump_file, ")\n");
3817 }
3818
3819 /* This computes the dependence relation for the same data
3820    reference into DDR.  */
3821
3822 static void
3823 compute_self_dependence (struct data_dependence_relation *ddr)
3824 {
3825   unsigned int i;
3826   struct subscript *subscript;
3827
3828   if (DDR_ARE_DEPENDENT (ddr) != NULL_TREE)
3829     return;
3830
3831   for (i = 0; VEC_iterate (subscript_p, DDR_SUBSCRIPTS (ddr), i, subscript);
3832        i++)
3833     {
3834       /* The accessed index overlaps for each iteration.  */
3835       SUB_CONFLICTS_IN_A (subscript)
3836               = conflict_fn (1, affine_fn_cst (integer_zero_node));
3837       SUB_CONFLICTS_IN_B (subscript)
3838               = conflict_fn (1, affine_fn_cst (integer_zero_node));
3839       SUB_LAST_CONFLICT (subscript) = chrec_dont_know;
3840     }
3841
3842   /* The distance vector is the zero vector.  */
3843   save_dist_v (ddr, lambda_vector_new (DDR_NB_LOOPS (ddr)));
3844   save_dir_v (ddr, lambda_vector_new (DDR_NB_LOOPS (ddr)));
3845 }
3846
3847 /* Compute in DEPENDENCE_RELATIONS the data dependence graph for all
3848    the data references in DATAREFS, in the LOOP_NEST.  When
3849    COMPUTE_SELF_AND_RR is FALSE, don't compute read-read and self
3850    relations.  */
3851
3852 void
3853 compute_all_dependences (VEC (data_reference_p, heap) *datarefs,
3854                          VEC (ddr_p, heap) **dependence_relations,
3855                          VEC (loop_p, heap) *loop_nest,
3856                          bool compute_self_and_rr)
3857 {
3858   struct data_dependence_relation *ddr;
3859   struct data_reference *a, *b;
3860   unsigned int i, j;
3861
3862   for (i = 0; VEC_iterate (data_reference_p, datarefs, i, a); i++)
3863     for (j = i + 1; VEC_iterate (data_reference_p, datarefs, j, b); j++)
3864       if (!DR_IS_READ (a) || !DR_IS_READ (b) || compute_self_and_rr)
3865         {
3866           ddr = initialize_data_dependence_relation (a, b, loop_nest);
3867           VEC_safe_push (ddr_p, heap, *dependence_relations, ddr);
3868           compute_affine_dependence (ddr);
3869         }
3870
3871   if (compute_self_and_rr)
3872     for (i = 0; VEC_iterate (data_reference_p, datarefs, i, a); i++)
3873       {
3874         ddr = initialize_data_dependence_relation (a, a, loop_nest);
3875         VEC_safe_push (ddr_p, heap, *dependence_relations, ddr);
3876         compute_self_dependence (ddr);
3877       }
3878 }
3879
3880 /* Stores the locations of memory references in STMT to REFERENCES.  Returns
3881    true if STMT clobbers memory, false otherwise.  */
3882
3883 bool
3884 get_references_in_stmt (tree stmt, VEC (data_ref_loc, heap) **references)
3885 {
3886   bool clobbers_memory = false;
3887   data_ref_loc *ref;
3888   tree *op0, *op1, call;
3889
3890   *references = NULL;
3891
3892   /* ASM_EXPR and CALL_EXPR may embed arbitrary side effects.
3893      Calls have side-effects, except those to const or pure
3894      functions.  */
3895   call = get_call_expr_in (stmt);
3896   if ((call
3897        && !(call_expr_flags (call) & (ECF_CONST | ECF_PURE)))
3898       || (TREE_CODE (stmt) == ASM_EXPR
3899           && ASM_VOLATILE_P (stmt)))
3900     clobbers_memory = true;
3901
3902   if (ZERO_SSA_OPERANDS (stmt, SSA_OP_ALL_VIRTUALS))
3903     return clobbers_memory;
3904
3905   if (TREE_CODE (stmt) ==  GIMPLE_MODIFY_STMT)
3906     {
3907       op0 = &GIMPLE_STMT_OPERAND (stmt, 0);
3908       op1 = &GIMPLE_STMT_OPERAND (stmt, 1);
3909
3910       if (DECL_P (*op1)
3911           || REFERENCE_CLASS_P (*op1))
3912         {
3913           ref = VEC_safe_push (data_ref_loc, heap, *references, NULL);
3914           ref->pos = op1;
3915           ref->is_read = true;
3916         }
3917
3918       if (DECL_P (*op0)
3919           || REFERENCE_CLASS_P (*op0))
3920         {
3921           ref = VEC_safe_push (data_ref_loc, heap, *references, NULL);
3922           ref->pos = op0;
3923           ref->is_read = false;
3924         }
3925     }
3926
3927   if (call)
3928     {
3929       unsigned i, n = call_expr_nargs (call);
3930
3931       for (i = 0; i < n; i++)
3932         {
3933           op0 = &CALL_EXPR_ARG (call, i);
3934
3935           if (DECL_P (*op0)
3936               || REFERENCE_CLASS_P (*op0))
3937             {
3938               ref = VEC_safe_push (data_ref_loc, heap, *references, NULL);
3939               ref->pos = op0;
3940               ref->is_read = true;
3941             }
3942         }
3943     }
3944
3945   return clobbers_memory;
3946 }
3947
3948 /* Stores the data references in STMT to DATAREFS.  If there is an unanalyzable
3949    reference, returns false, otherwise returns true.  NEST is the outermost
3950    loop of the loop nest in that the references should be analyzed.  */
3951
3952 static bool
3953 find_data_references_in_stmt (struct loop *nest, tree stmt,
3954                               VEC (data_reference_p, heap) **datarefs)
3955 {
3956   unsigned i;
3957   VEC (data_ref_loc, heap) *references;
3958   data_ref_loc *ref;
3959   bool ret = true;
3960   data_reference_p dr;
3961
3962   if (get_references_in_stmt (stmt, &references))
3963     {
3964       VEC_free (data_ref_loc, heap, references);
3965       return false;
3966     }
3967
3968   for (i = 0; VEC_iterate (data_ref_loc, references, i, ref); i++)
3969     {
3970       dr = create_data_ref (nest, *ref->pos, stmt, ref->is_read);
3971       gcc_assert (dr != NULL);
3972
3973       /* FIXME -- data dependence analysis does not work correctly for objects with
3974          invariant addresses.  Let us fail here until the problem is fixed.  */
3975       if (dr_address_invariant_p (dr))
3976         {
3977           free_data_ref (dr);
3978           if (dump_file && (dump_flags & TDF_DETAILS))
3979             fprintf (dump_file, "\tFAILED as dr address is invariant\n");
3980           ret = false;
3981           break;
3982         }
3983
3984       VEC_safe_push (data_reference_p, heap, *datarefs, dr);
3985     }
3986   VEC_free (data_ref_loc, heap, references);
3987   return ret;
3988 }
3989
3990 /* Search the data references in LOOP, and record the information into
3991    DATAREFS.  Returns chrec_dont_know when failing to analyze a
3992    difficult case, returns NULL_TREE otherwise.
3993
3994    TODO: This function should be made smarter so that it can handle address
3995    arithmetic as if they were array accesses, etc.  */
3996
3997 static tree
3998 find_data_references_in_loop (struct loop *loop,
3999                               VEC (data_reference_p, heap) **datarefs)
4000 {
4001   basic_block bb, *bbs;
4002   unsigned int i;
4003   block_stmt_iterator bsi;
4004
4005   bbs = get_loop_body_in_dom_order (loop);
4006
4007   for (i = 0; i < loop->num_nodes; i++)
4008     {
4009       bb = bbs[i];
4010
4011       for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
4012         {
4013           tree stmt = bsi_stmt (bsi);
4014
4015           if (!find_data_references_in_stmt (loop, stmt, datarefs))
4016             {
4017               struct data_reference *res;
4018               res = XCNEW (struct data_reference);
4019               VEC_safe_push (data_reference_p, heap, *datarefs, res);
4020
4021               free (bbs);
4022               return chrec_dont_know;
4023             }
4024         }
4025     }
4026   free (bbs);
4027
4028   return NULL_TREE;
4029 }
4030
4031 /* Recursive helper function.  */
4032
4033 static bool
4034 find_loop_nest_1 (struct loop *loop, VEC (loop_p, heap) **loop_nest)
4035 {
4036   /* Inner loops of the nest should not contain siblings.  Example:
4037      when there are two consecutive loops,
4038
4039      | loop_0
4040      |   loop_1
4041      |     A[{0, +, 1}_1]
4042      |   endloop_1
4043      |   loop_2
4044      |     A[{0, +, 1}_2]
4045      |   endloop_2
4046      | endloop_0
4047
4048      the dependence relation cannot be captured by the distance
4049      abstraction.  */
4050   if (loop->next)
4051     return false;
4052
4053   VEC_safe_push (loop_p, heap, *loop_nest, loop);
4054   if (loop->inner)
4055     return find_loop_nest_1 (loop->inner, loop_nest);
4056   return true;
4057 }
4058
4059 /* Return false when the LOOP is not well nested.  Otherwise return
4060    true and insert in LOOP_NEST the loops of the nest.  LOOP_NEST will
4061    contain the loops from the outermost to the innermost, as they will
4062    appear in the classic distance vector.  */
4063
4064 bool
4065 find_loop_nest (struct loop *loop, VEC (loop_p, heap) **loop_nest)
4066 {
4067   VEC_safe_push (loop_p, heap, *loop_nest, loop);
4068   if (loop->inner)
4069     return find_loop_nest_1 (loop->inner, loop_nest);
4070   return true;
4071 }
4072
4073 /* Given a loop nest LOOP, the following vectors are returned:
4074    DATAREFS is initialized to all the array elements contained in this loop,
4075    DEPENDENCE_RELATIONS contains the relations between the data references.
4076    Compute read-read and self relations if
4077    COMPUTE_SELF_AND_READ_READ_DEPENDENCES is TRUE.  */
4078
4079 void
4080 compute_data_dependences_for_loop (struct loop *loop,
4081                                    bool compute_self_and_read_read_dependences,
4082                                    VEC (data_reference_p, heap) **datarefs,
4083                                    VEC (ddr_p, heap) **dependence_relations)
4084 {
4085   VEC (loop_p, heap) *vloops = VEC_alloc (loop_p, heap, 3);
4086
4087   memset (&dependence_stats, 0, sizeof (dependence_stats));
4088
4089   /* If the loop nest is not well formed, or one of the data references
4090      is not computable, give up without spending time to compute other
4091      dependences.  */
4092   if (!loop
4093       || !find_loop_nest (loop, &vloops)
4094       || find_data_references_in_loop (loop, datarefs) == chrec_dont_know)
4095     {
4096       struct data_dependence_relation *ddr;
4097
4098       /* Insert a single relation into dependence_relations:
4099          chrec_dont_know.  */
4100       ddr = initialize_data_dependence_relation (NULL, NULL, vloops);
4101       VEC_safe_push (ddr_p, heap, *dependence_relations, ddr);
4102     }
4103   else
4104     compute_all_dependences (*datarefs, dependence_relations, vloops,
4105                              compute_self_and_read_read_dependences);
4106
4107   if (dump_file && (dump_flags & TDF_STATS))
4108     {
4109       fprintf (dump_file, "Dependence tester statistics:\n");
4110
4111       fprintf (dump_file, "Number of dependence tests: %d\n",
4112                dependence_stats.num_dependence_tests);
4113       fprintf (dump_file, "Number of dependence tests classified dependent: %d\n",
4114                dependence_stats.num_dependence_dependent);
4115       fprintf (dump_file, "Number of dependence tests classified independent: %d\n",
4116                dependence_stats.num_dependence_independent);
4117       fprintf (dump_file, "Number of undetermined dependence tests: %d\n",
4118                dependence_stats.num_dependence_undetermined);
4119
4120       fprintf (dump_file, "Number of subscript tests: %d\n",
4121                dependence_stats.num_subscript_tests);
4122       fprintf (dump_file, "Number of undetermined subscript tests: %d\n",
4123                dependence_stats.num_subscript_undetermined);
4124       fprintf (dump_file, "Number of same subscript function: %d\n",
4125                dependence_stats.num_same_subscript_function);
4126
4127       fprintf (dump_file, "Number of ziv tests: %d\n",
4128                dependence_stats.num_ziv);
4129       fprintf (dump_file, "Number of ziv tests returning dependent: %d\n",
4130                dependence_stats.num_ziv_dependent);
4131       fprintf (dump_file, "Number of ziv tests returning independent: %d\n",
4132                dependence_stats.num_ziv_independent);
4133       fprintf (dump_file, "Number of ziv tests unimplemented: %d\n",
4134                dependence_stats.num_ziv_unimplemented);
4135
4136       fprintf (dump_file, "Number of siv tests: %d\n",
4137                dependence_stats.num_siv);
4138       fprintf (dump_file, "Number of siv tests returning dependent: %d\n",
4139                dependence_stats.num_siv_dependent);
4140       fprintf (dump_file, "Number of siv tests returning independent: %d\n",
4141                dependence_stats.num_siv_independent);
4142       fprintf (dump_file, "Number of siv tests unimplemented: %d\n",
4143                dependence_stats.num_siv_unimplemented);
4144
4145       fprintf (dump_file, "Number of miv tests: %d\n",
4146                dependence_stats.num_miv);
4147       fprintf (dump_file, "Number of miv tests returning dependent: %d\n",
4148                dependence_stats.num_miv_dependent);
4149       fprintf (dump_file, "Number of miv tests returning independent: %d\n",
4150                dependence_stats.num_miv_independent);
4151       fprintf (dump_file, "Number of miv tests unimplemented: %d\n",
4152                dependence_stats.num_miv_unimplemented);
4153     }
4154 }
4155
4156 /* Entry point (for testing only).  Analyze all the data references
4157    and the dependence relations in LOOP.
4158
4159    The data references are computed first.
4160
4161    A relation on these nodes is represented by a complete graph.  Some
4162    of the relations could be of no interest, thus the relations can be
4163    computed on demand.
4164
4165    In the following function we compute all the relations.  This is
4166    just a first implementation that is here for:
4167    - for showing how to ask for the dependence relations,
4168    - for the debugging the whole dependence graph,
4169    - for the dejagnu testcases and maintenance.
4170
4171    It is possible to ask only for a part of the graph, avoiding to
4172    compute the whole dependence graph.  The computed dependences are
4173    stored in a knowledge base (KB) such that later queries don't
4174    recompute the same information.  The implementation of this KB is
4175    transparent to the optimizer, and thus the KB can be changed with a
4176    more efficient implementation, or the KB could be disabled.  */
4177 static void
4178 analyze_all_data_dependences (struct loop *loop)
4179 {
4180   unsigned int i;
4181   int nb_data_refs = 10;
4182   VEC (data_reference_p, heap) *datarefs =
4183     VEC_alloc (data_reference_p, heap, nb_data_refs);
4184   VEC (ddr_p, heap) *dependence_relations =
4185     VEC_alloc (ddr_p, heap, nb_data_refs * nb_data_refs);
4186
4187   /* Compute DDs on the whole function.  */
4188   compute_data_dependences_for_loop (loop, false, &datarefs,
4189                                      &dependence_relations);
4190
4191   if (dump_file)
4192     {
4193       dump_data_dependence_relations (dump_file, dependence_relations);
4194       fprintf (dump_file, "\n\n");
4195
4196       if (dump_flags & TDF_DETAILS)
4197         dump_dist_dir_vectors (dump_file, dependence_relations);
4198
4199       if (dump_flags & TDF_STATS)
4200         {
4201           unsigned nb_top_relations = 0;
4202           unsigned nb_bot_relations = 0;
4203           unsigned nb_basename_differ = 0;
4204           unsigned nb_chrec_relations = 0;
4205           struct data_dependence_relation *ddr;
4206
4207           for (i = 0; VEC_iterate (ddr_p, dependence_relations, i, ddr); i++)
4208             {
4209               if (chrec_contains_undetermined (DDR_ARE_DEPENDENT (ddr)))
4210                 nb_top_relations++;
4211
4212               else if (DDR_ARE_DEPENDENT (ddr) == chrec_known)
4213                 {
4214                   struct data_reference *a = DDR_A (ddr);
4215                   struct data_reference *b = DDR_B (ddr);
4216
4217                   if (!bitmap_intersect_p (DR_VOPS (a), DR_VOPS (b)))
4218                     nb_basename_differ++;
4219                   else
4220                     nb_bot_relations++;
4221                 }
4222
4223               else
4224                 nb_chrec_relations++;
4225             }
4226
4227           gather_stats_on_scev_database ();
4228         }
4229     }
4230
4231   free_dependence_relations (dependence_relations);
4232   free_data_refs (datarefs);
4233 }
4234
4235 /* Computes all the data dependences and check that the results of
4236    several analyzers are the same.  */
4237
4238 void
4239 tree_check_data_deps (void)
4240 {
4241   loop_iterator li;
4242   struct loop *loop_nest;
4243
4244   FOR_EACH_LOOP (li, loop_nest, 0)
4245     analyze_all_data_dependences (loop_nest);
4246 }
4247
4248 /* Free the memory used by a data dependence relation DDR.  */
4249
4250 void
4251 free_dependence_relation (struct data_dependence_relation *ddr)
4252 {
4253   if (ddr == NULL)
4254     return;
4255
4256   if (DDR_ARE_DEPENDENT (ddr) == NULL_TREE && DDR_SUBSCRIPTS (ddr))
4257     free_subscripts (DDR_SUBSCRIPTS (ddr));
4258
4259   free (ddr);
4260 }
4261
4262 /* Free the memory used by the data dependence relations from
4263    DEPENDENCE_RELATIONS.  */
4264
4265 void
4266 free_dependence_relations (VEC (ddr_p, heap) *dependence_relations)
4267 {
4268   unsigned int i;
4269   struct data_dependence_relation *ddr;
4270   VEC (loop_p, heap) *loop_nest = NULL;
4271
4272   for (i = 0; VEC_iterate (ddr_p, dependence_relations, i, ddr); i++)
4273     {
4274       if (ddr == NULL)
4275         continue;
4276       if (loop_nest == NULL)
4277         loop_nest = DDR_LOOP_NEST (ddr);
4278       else
4279         gcc_assert (DDR_LOOP_NEST (ddr) == NULL
4280                     || DDR_LOOP_NEST (ddr) == loop_nest);
4281       free_dependence_relation (ddr);
4282     }
4283
4284   if (loop_nest)
4285     VEC_free (loop_p, heap, loop_nest);
4286   VEC_free (ddr_p, heap, dependence_relations);
4287 }
4288
4289 /* Free the memory used by the data references from DATAREFS.  */
4290
4291 void
4292 free_data_refs (VEC (data_reference_p, heap) *datarefs)
4293 {
4294   unsigned int i;
4295   struct data_reference *dr;
4296
4297   for (i = 0; VEC_iterate (data_reference_p, datarefs, i, dr); i++)
4298     free_data_ref (dr);
4299   VEC_free (data_reference_p, heap, datarefs);
4300 }
4301