gcc/ssa.c

   1 /* Static Single Assignment conversion routines for the GNU compiler.
   2    Copyright (C) 2000 Free Software Foundation, Inc.
   3
   4 This file is part of GNU CC.
   5
   6 GNU CC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 2, or (at your option) any
   9 later version.
  10
  11 GNU CC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GNU CC; see the file COPYING.  If not, write to the Free
  18 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  19 02111-1307, USA.  */
  20
  21 /* References:
  22
  23    Building an Optimizing Compiler
  24    Robert Morgan
  25    Butterworth-Heinemann, 1998
  26
  27    Static Single Assignment Construction
  28    Preston Briggs, Tim Harvey, Taylor Simpson
  29    Technical Report, Rice University, 1995
  30    ftp://ftp.cs.rice.edu/public/preston/optimizer/SSA.ps.gz
  31 */
  32
  33 #include "config.h"
  34 #include "system.h"
  35
  36 #include "rtl.h"
  37 #include "regs.h"
  38 #include "hard-reg-set.h"
  39 #include "flags.h"
  40 #include "function.h"
  41 #include "real.h"
  42 #include "insn-config.h"
  43 #include "recog.h"
  44 #include "basic-block.h"
  45 #include "output.h"
  46 #include "partition.h"
  47
  48
  49 /* TODO:
  50
  51    Handle subregs better, maybe.  For now, if a reg that's set in a
  52    subreg expression is duplicated going into SSA form, an extra copy
  53    is inserted first that copies the entire reg into the duplicate, so
  54    that the other bits are preserved.  This isn't strictly SSA, since
  55    at least part of the reg is assigned in more than one place (though
  56    they are adjacent).
  57
  58    ??? What to do about strict_low_part.  Probably I'll have to split
  59    them out of their current instructions first thing.
  60
  61    Actually the best solution may be to have a kind of "mid-level rtl"
  62    in which the RTL encodes exactly what we want, without exposing a
  63    lot of niggling processor details.  At some later point we lower
  64    the representation, calling back into optabs to finish any necessary
  65    expansion.  */
  66
  67
  68 /* If conservative_reg_partition is non-zero, use a conservative
  69    register partitioning algorithm (which leaves more regs after
  70    emerging from SSA) instead of the coalescing one.  This is being
  71    left in for a limited time only, as a debugging tool until the
  72    coalescing algorithm is validated.  */
  73 static int conservative_reg_partition;
  74
  75 /* This flag is set when the CFG is in SSA form.  */
  76 int in_ssa_form = 0;
  77
  78 /* Element I is the single instruction that sets register I+PSEUDO.  */
  79 varray_type ssa_definition;
  80
  81 /* Element I is an INSN_LIST of instructions that use register I+PSEUDO.  */
  82 varray_type ssa_uses;
  83
  84 /* Element I-PSEUDO is the normal register that originated the ssa
  85    register in question.  */
  86 varray_type ssa_rename_from;
  87
  88 /* The running target ssa register for a given normal register.  */
  89 static rtx *ssa_rename_to;
  90
  91 /* The number of registers that were live on entry to the SSA routines.  */
  92 static unsigned int ssa_max_reg_num;
  93
  94 /* Local function prototypes.  */
  95
  96 static inline rtx * phi_alternative
  97   PARAMS ((rtx, int));
  98
  99 static int remove_phi_alternative
 100   PARAMS ((rtx, int));
 101 static void simplify_to_immediate_dominators
 102   PARAMS ((int *idom, sbitmap *dominators));
 103 static void compute_dominance_frontiers_1
 104   PARAMS ((sbitmap *frontiers, int *idom, int bb, sbitmap done));
 105 static void compute_dominance_frontiers
 106   PARAMS ((sbitmap *frontiers, int *idom));
 107 static void find_evaluations_1
 108   PARAMS ((rtx dest, rtx set, void *data));
 109 static void find_evaluations
 110   PARAMS ((sbitmap *evals, int nregs));
 111 static void compute_iterated_dominance_frontiers
 112   PARAMS ((sbitmap *idfs, sbitmap *frontiers, sbitmap *evals, int nregs));
 113 static void insert_phi_node
 114   PARAMS ((int regno, int b));
 115 static void insert_phi_nodes
 116   PARAMS ((sbitmap *idfs, sbitmap *evals, int nregs));
 117 static int rename_insn_1
 118   PARAMS ((rtx *ptr, void *data));
 119 static void rename_block
 120   PARAMS ((int b, int *idom));
 121 static void rename_registers
 122   PARAMS ((int nregs, int *idom));
 123
 124 static inline int ephi_add_node
 125   PARAMS ((rtx reg, rtx *nodes, int *n_nodes));
 126 static int * ephi_forward
 127   PARAMS ((int t, sbitmap visited, sbitmap *succ, int *tstack));
 128 static void ephi_backward
 129   PARAMS ((int t, sbitmap visited, sbitmap *pred, rtx *nodes));
 130 static void ephi_create
 131   PARAMS ((int t, sbitmap visited, sbitmap *pred, sbitmap *succ, rtx *nodes));
 132 static void eliminate_phi
 133   PARAMS ((edge e, partition reg_partition));
 134 static int make_regs_equivalent_over_bad_edges
 135   PARAMS ((int bb, partition reg_partition));
 136
 137 /* These are used only in the conservative register partitioning
 138    algorithms.  */
 139 static int make_equivalent_phi_alternatives_equivalent
 140   PARAMS ((int bb, partition reg_partition));
 141 static partition compute_conservative_reg_partition
 142   PARAMS ((void));
 143 static int rename_equivalent_regs_in_insn
 144   PARAMS ((rtx *ptr, void *data));
 145
 146 /* These are used in the register coalescing algorithm.  */
 147 static int coalesce_if_unconflicting
 148   PARAMS ((partition p, conflict_graph conflicts, int reg1, int reg2));
 149 static int coalesce_regs_in_copies
 150   PARAMS ((int bb, partition p, conflict_graph conflicts));
 151 static int coalesce_reg_in_phi
 152   PARAMS ((rtx, int dest_regno, int src_regno, void *data));
 153 static int coalesce_regs_in_successor_phi_nodes
 154   PARAMS ((int bb, partition p, conflict_graph conflicts));
 155 static partition compute_coalesced_reg_partition
 156   PARAMS (());
 157 static int mark_reg_in_phi
 158   PARAMS ((rtx *ptr, void *data));
 159 static void mark_phi_and_copy_regs
 160   PARAMS ((regset phi_set));
 161
 162 static int rename_equivalent_regs_in_insn
 163   PARAMS ((rtx *ptr, void *data));
 164 static void rename_equivalent_regs
 165   PARAMS ((partition reg_partition));
 166
 167
 168 /* Given the SET of a PHI node, return the address of the alternative
 169    for predecessor block C.  */
 170
 171 static inline rtx *
 172 phi_alternative (set, c)
 173      rtx set;
 174      int c;
 175 {
 176   rtvec phi_vec = XVEC (SET_SRC (set), 0);
 177   int v;
 178
 179   for (v = GET_NUM_ELEM (phi_vec) - 2; v >= 0; v -= 2)
 180     if (INTVAL (RTVEC_ELT (phi_vec, v + 1)) == c)
 181       return &RTVEC_ELT (phi_vec, v);
 182
 183   return NULL;
 184 }
 185
 186 /* Given the SET of a phi node, remove the alternative for predecessor
 187    block C.  Return non-zero on success, or zero if no alternative is
 188    found for C.  */
 189
 190 static int
 191 remove_phi_alternative (set, c)
 192      rtx set;
 193      int c;
 194 {
 195   rtvec phi_vec = XVEC (SET_SRC (set), 0);
 196   int num_elem = GET_NUM_ELEM (phi_vec);
 197   int v;
 198
 199   for (v = num_elem - 2; v >= 0; v -= 2)
 200     if (INTVAL (RTVEC_ELT (phi_vec, v + 1)) == c)
 201       {
 202         if (v < num_elem - 2)
 203           {
 204             RTVEC_ELT (phi_vec, v) = RTVEC_ELT (phi_vec, num_elem - 2);
 205             RTVEC_ELT (phi_vec, v + 1) = RTVEC_ELT (phi_vec, num_elem - 1);
 206           }
 207         PUT_NUM_ELEM (phi_vec, num_elem - 2);
 208         return 1;
 209       }
 210
 211   return 0;
 212 }
 213
 214 /* Computing the Immediate Dominators:
 215
 216    Throughout, we don't actually want the full dominators set as
 217    calculated by flow, but rather the immediate dominators.
 218 */
 219
 220 static void
 221 simplify_to_immediate_dominators (idom, dominators)
 222      int *idom;
 223      sbitmap *dominators;
 224 {
 225   sbitmap *tmp;
 226   int b;
 227
 228   tmp = sbitmap_vector_alloc (n_basic_blocks, n_basic_blocks);
 229
 230   /* Begin with tmp(n) = dom(n) - { n }.  */
 231   for (b = n_basic_blocks; --b >= 0; )
 232     {
 233       sbitmap_copy (tmp[b], dominators[b]);
 234       RESET_BIT (tmp[b], b);
 235     }
 236
 237   /* Subtract out all of our dominator's dominators.  */
 238   for (b = n_basic_blocks; --b >= 0; )
 239     {
 240       sbitmap tmp_b = tmp[b];
 241       int s;
 242
 243       for (s = n_basic_blocks; --s >= 0; )
 244         if (TEST_BIT (tmp_b, s))
 245           sbitmap_difference (tmp_b, tmp_b, tmp[s]);
 246     }
 247
 248   /* Find the one bit set in the bitmap and put it in the output array.  */
 249   for (b = n_basic_blocks; --b >= 0; )
 250     {
 251       int t;
 252       EXECUTE_IF_SET_IN_SBITMAP (tmp[b], 0, t, { idom[b] = t; });
 253     }
 254
 255   sbitmap_vector_free (tmp);
 256 }
 257
 258
 259 /* For all registers, find all blocks in which they are set.
 260
 261    This is the transform of what would be local kill information that
 262    we ought to be getting from flow.  */
 263
 264 static sbitmap *fe_evals;
 265 static int fe_current_bb;
 266
 267 static void
 268 find_evaluations_1 (dest, set, data)
 269      rtx dest;
 270      rtx set ATTRIBUTE_UNUSED;
 271      void *data ATTRIBUTE_UNUSED;
 272 {
 273   if (GET_CODE (dest) == REG
 274       && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
 275     SET_BIT (fe_evals[REGNO (dest) - FIRST_PSEUDO_REGISTER], fe_current_bb);
 276 }
 277
 278 static void
 279 find_evaluations (evals, nregs)
 280      sbitmap *evals;
 281      int nregs;
 282 {
 283   int bb;
 284
 285   sbitmap_vector_zero (evals, nregs);
 286   fe_evals = evals;
 287
 288   for (bb = n_basic_blocks; --bb >= 0; )
 289     {
 290       rtx p, last;
 291
 292       fe_current_bb = bb;
 293       p = BLOCK_HEAD (bb);
 294       last = BLOCK_END (bb);
 295       while (1)
 296         {
 297           if (GET_RTX_CLASS (GET_CODE (p)) == 'i')
 298             note_stores (PATTERN (p), find_evaluations_1, NULL);
 299
 300           if (p == last)
 301             break;
 302           p = NEXT_INSN (p);
 303         }
 304     }
 305 }
 306
 307
 308 /* Computing the Dominance Frontier:
 309
 310    As decribed in Morgan, section 3.5, this may be done simply by
 311    walking the dominator tree bottom-up, computing the frontier for
 312    the children before the parent.  When considering a block B,
 313    there are two cases:
 314
 315    (1) A flow graph edge leaving B that does not lead to a child
 316    of B in the dominator tree must be a block that is either equal
 317    to B or not dominated by B.  Such blocks belong in the frontier
 318    of B.
 319
 320    (2) Consider a block X in the frontier of one of the children C
 321    of B.  If X is not equal to B and is not dominated by B, it
 322    is in the frontier of B.
 323 */
 324
 325 static void
 326 compute_dominance_frontiers_1 (frontiers, idom, bb, done)
 327      sbitmap *frontiers;
 328      int *idom;
 329      int bb;
 330      sbitmap done;
 331 {
 332   basic_block b = BASIC_BLOCK (bb);
 333   edge e;
 334   int c;
 335
 336   SET_BIT (done, bb);
 337   sbitmap_zero (frontiers[bb]);
 338
 339   /* Do the frontier of the children first.  Not all children in the
 340      dominator tree (blocks dominated by this one) are children in the
 341      CFG, so check all blocks.  */
 342   for (c = 0; c < n_basic_blocks; ++c)
 343     if (idom[c] == bb && ! TEST_BIT (done, c))
 344       compute_dominance_frontiers_1 (frontiers, idom, c, done);
 345
 346   /* Find blocks conforming to rule (1) above.  */
 347   for (e = b->succ; e; e = e->succ_next)
 348     {
 349       if (e->dest == EXIT_BLOCK_PTR)
 350         continue;
 351       if (idom[e->dest->index] != bb)
 352         SET_BIT (frontiers[bb], e->dest->index);
 353     }
 354
 355   /* Find blocks conforming to rule (2).  */
 356   for (c = 0; c < n_basic_blocks; ++c)
 357     if (idom[c] == bb)
 358       {
 359         int x;
 360         EXECUTE_IF_SET_IN_SBITMAP (frontiers[c], 0, x,
 361           {
 362             if (idom[x] != bb)
 363               SET_BIT (frontiers[bb], x);
 364           });
 365       }
 366 }
 367
 368 static void
 369 compute_dominance_frontiers (frontiers, idom)
 370      sbitmap *frontiers;
 371      int *idom;
 372 {
 373   sbitmap done = sbitmap_alloc (n_basic_blocks);
 374   sbitmap_zero (done);
 375
 376   compute_dominance_frontiers_1 (frontiers, idom, 0, done);
 377
 378   sbitmap_free (done);
 379 }
 380
 381
 382 /* Computing the Iterated Dominance Frontier:
 383
 384    This is the set of merge points for a given register.
 385
 386    This is not particularly intuitive.  See section 7.1 of Morgan, in
 387    particular figures 7.3 and 7.4 and the immediately surrounding text.
 388 */
 389
 390 static void
 391 compute_iterated_dominance_frontiers (idfs, frontiers, evals, nregs)
 392      sbitmap *idfs;
 393      sbitmap *frontiers;
 394      sbitmap *evals;
 395      int nregs;
 396 {
 397   sbitmap worklist;
 398   int reg, passes = 0;
 399
 400   worklist = sbitmap_alloc (n_basic_blocks);
 401
 402   for (reg = 0; reg < nregs; ++reg)
 403     {
 404       sbitmap idf = idfs[reg];
 405       int b, changed;
 406
 407       /* Start the iterative process by considering those blocks that
 408          evaluate REG.  We'll add their dominance frontiers to the
 409          IDF, and then consider the blocks we just added.  */
 410       sbitmap_copy (worklist, evals[reg]);
 411
 412       /* Morgan's algorithm is incorrect here.  Blocks that evaluate
 413          REG aren't necessarily in REG's IDF.  Start with an empty IDF.  */
 414       sbitmap_zero (idf);
 415
 416       /* Iterate until the worklist is empty.  */
 417       do
 418         {
 419           changed = 0;
 420           passes++;
 421           EXECUTE_IF_SET_IN_SBITMAP (worklist, 0, b,
 422             {
 423               RESET_BIT (worklist, b);
 424               /* For each block on the worklist, add to the IDF all
 425                  blocks on its dominance frontier that aren't already
 426                  on the IDF.  Every block that's added is also added
 427                  to the worklist.  */
 428               sbitmap_union_of_diff (worklist, worklist, frontiers[b], idf);
 429               sbitmap_a_or_b (idf, idf, frontiers[b]);
 430               changed = 1;
 431             });
 432         }
 433       while (changed);
 434     }
 435
 436   sbitmap_free (worklist);
 437
 438   if (rtl_dump_file)
 439     {
 440       fprintf(rtl_dump_file,
 441               "Iterated dominance frontier: %d passes on %d regs.\n",
 442               passes, nregs);
 443     }
 444 }
 445
 446
 447 /* Insert the phi nodes.  */
 448
 449 static void
 450 insert_phi_node (regno, bb)
 451      int regno, bb;
 452 {
 453   basic_block b = BASIC_BLOCK (bb);
 454   edge e;
 455   int npred, i;
 456   rtvec vec;
 457   rtx phi, reg;
 458
 459   /* Find out how many predecessors there are.  */
 460   for (e = b->pred, npred = 0; e; e = e->pred_next)
 461     if (e->src != ENTRY_BLOCK_PTR)
 462       npred++;
 463
 464   /* If this block has no "interesting" preds, then there is nothing to
 465      do.  Consider a block that only has the entry block as a pred.  */
 466   if (npred == 0)
 467     return;
 468
 469   /* This is the register to which the phi function will be assinged.  */
 470   reg = regno_reg_rtx[regno + FIRST_PSEUDO_REGISTER];
 471
 472   /* Construct the arguments to the PHI node.  The use of pc_rtx is just
 473      a placeholder; we'll insert the proper value in rename_registers.  */
 474   vec = rtvec_alloc (npred * 2);
 475   for (e = b->pred, i = 0; e ; e = e->pred_next, i += 2)
 476     if (e->src != ENTRY_BLOCK_PTR)
 477       {
 478         RTVEC_ELT (vec, i + 0) = pc_rtx;
 479         RTVEC_ELT (vec, i + 1) = GEN_INT (e->src->index);
 480       }
 481
 482   phi = gen_rtx_PHI (VOIDmode, vec);
 483   phi = gen_rtx_SET (VOIDmode, reg, phi);
 484
 485   if (GET_CODE (b->head) == CODE_LABEL)
 486     emit_insn_after (phi, b->head);
 487   else
 488     b->head = emit_insn_before (phi, b->head);
 489 }
 490
 491
 492 static void
 493 insert_phi_nodes (idfs, evals, nregs)
 494      sbitmap *idfs;
 495      sbitmap *evals ATTRIBUTE_UNUSED;
 496      int nregs;
 497 {
 498   int reg;
 499
 500   for (reg = 0; reg < nregs; ++reg)
 501     {
 502       int b;
 503       EXECUTE_IF_SET_IN_SBITMAP (idfs[reg], 0, b,
 504         {
 505           if (REGNO_REG_SET_P (BASIC_BLOCK (b)->global_live_at_start,
 506                                reg + FIRST_PSEUDO_REGISTER))
 507             insert_phi_node (reg, b);
 508         });
 509     }
 510 }
 511
 512 /* Rename the registers to conform to SSA.
 513
 514    This is essentially the algorithm presented in Figure 7.8 of Morgan,
 515    with a few changes to reduce pattern search time in favour of a bit
 516    more memory usage.  */
 517
 518
 519 /* One of these is created for each set.  It will live in a list local
 520    to its basic block for the duration of that block's processing.  */
 521 struct rename_set_data
 522 {
 523   struct rename_set_data *next;
 524   rtx *reg_loc;
 525   rtx set_dest;
 526   rtx new_reg;
 527   rtx prev_reg;
 528   rtx set_insn;
 529 };
 530
 531 /* This struct is used to pass information to callback functions while
 532    renaming registers.  */
 533 struct rename_context
 534 {
 535   struct rename_set_data *set_data;
 536   rtx current_insn;
 537 };
 538
 539 static void new_registers_for_updates
 540   PARAMS ((struct rename_set_data *set_data,
 541            struct rename_set_data *old_set_data, rtx insn));
 542
 543 /* This is part of a rather ugly hack to allow the pre-ssa regno to be
 544    reused.  If, during processing, a register has not yet been touched,
 545    ssa_rename_to[regno] will be NULL.  Now, in the course of pushing
 546    and popping values from ssa_rename_to, when we would ordinarily
 547    pop NULL back in, we pop RENAME_NO_RTX.  We treat this exactly the
 548    same as NULL, except that it signals that the original regno has
 549    already been reused.  */
 550 #define RENAME_NO_RTX  pc_rtx
 551
 552 /* Part one of the first step of rename_block, called through for_each_rtx.
 553    Mark pseudos that are set for later update.  Transform uses of pseudos.  */
 554
 555 static int
 556 rename_insn_1 (ptr, data)
 557      rtx *ptr;
 558      void *data;
 559 {
 560   rtx x = *ptr;
 561   struct rename_context *context = data;
 562   struct rename_set_data **set_datap = &(context->set_data);
 563
 564   if (x == NULL_RTX)
 565     return 0;
 566
 567   switch (GET_CODE (x))
 568     {
 569     case SET:
 570       {
 571         rtx *destp = &SET_DEST (x);
 572         rtx dest = SET_DEST (x);
 573
 574         /* Subregs at word 0 are interesting.  Subregs at word != 0 are
 575            presumed to be part of a contiguous multi-word set sequence.  */
 576         while (GET_CODE (dest) == SUBREG
 577                && SUBREG_WORD (dest) == 0)
 578           {
 579             destp = &SUBREG_REG (dest);
 580             dest = SUBREG_REG (dest);
 581           }
 582
 583         if (GET_CODE (dest) == REG
 584             && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
 585           {
 586             /* We found a genuine set of an interesting register.  Tag
 587                it so that we can create a new name for it after we finish
 588                processing this insn.  */
 589
 590             struct rename_set_data *r;
 591             r = (struct rename_set_data *) xmalloc (sizeof(*r));
 592
 593             r->reg_loc = destp;
 594             r->set_dest = SET_DEST (x);
 595             r->set_insn = context->current_insn;
 596             r->next = *set_datap;
 597             *set_datap = r;
 598
 599             /* Since we do not wish to (directly) traverse the
 600                SET_DEST, recurse through for_each_rtx for the SET_SRC
 601                and return.  */
 602             for_each_rtx (&SET_SRC (x), rename_insn_1, data);
 603             return -1;
 604           }
 605
 606         /* Otherwise, this was not an interesting destination.  Continue
 607            on, marking uses as normal.  */
 608         return 0;
 609       }
 610
 611     case REG:
 612       if (REGNO (x) >= FIRST_PSEUDO_REGISTER
 613           && REGNO (x) < ssa_max_reg_num)
 614         {
 615           rtx new_reg = ssa_rename_to[REGNO(x) - FIRST_PSEUDO_REGISTER];
 616
 617           if (new_reg != NULL_RTX && new_reg != RENAME_NO_RTX)
 618             {
 619               if (GET_MODE (x) != GET_MODE (new_reg))
 620                 abort ();
 621               *ptr = new_reg;
 622             }
 623           /* Else this is a use before a set.  Warn?  */
 624         }
 625       return -1;
 626
 627     case PHI:
 628       /* Never muck with the phi.  We do that elsewhere, special-like.  */
 629       return -1;
 630
 631     default:
 632       /* Anything else, continue traversing.  */
 633       return 0;
 634     }
 635 }
 636
 637 /* Second part of the first step of rename_block.  The portion of the list
 638    beginning at SET_DATA through OLD_SET_DATA contain the sets present in
 639    INSN.  Update data structures accordingly.  */
 640
 641 static void
 642 new_registers_for_updates (set_data, old_set_data, insn)
 643      struct rename_set_data *set_data, *old_set_data;
 644      rtx insn;
 645 {
 646   while (set_data != old_set_data)
 647     {
 648       int regno, new_regno;
 649       rtx old_reg, new_reg, prev_reg;
 650
 651       old_reg = *set_data->reg_loc;
 652       regno = REGNO (*set_data->reg_loc);
 653
 654       /* For the first set we come across, reuse the original regno.  */
 655       if (ssa_rename_to[regno - FIRST_PSEUDO_REGISTER] == NULL_RTX)
 656         {
 657           new_reg = old_reg;
 658           prev_reg = RENAME_NO_RTX;
 659         }
 660       else
 661         {
 662           prev_reg = ssa_rename_to[regno - FIRST_PSEUDO_REGISTER];
 663           new_reg = gen_reg_rtx (GET_MODE (old_reg));
 664         }
 665
 666       set_data->new_reg = new_reg;
 667       set_data->prev_reg = prev_reg;
 668       new_regno = REGNO (new_reg);
 669       ssa_rename_to[regno - FIRST_PSEUDO_REGISTER] = new_reg;
 670
 671       if (new_regno >= (int) ssa_definition->num_elements)
 672         {
 673           int new_limit = new_regno * 5 / 4;
 674           ssa_definition = VARRAY_GROW (ssa_definition, new_limit);
 675           ssa_uses = VARRAY_GROW (ssa_uses, new_limit);
 676           ssa_rename_from = VARRAY_GROW (ssa_rename_from, new_limit);
 677         }
 678
 679       VARRAY_RTX (ssa_definition, new_regno) = insn;
 680       VARRAY_RTX (ssa_rename_from, new_regno) = old_reg;
 681
 682       set_data = set_data->next;
 683     }
 684 }
 685
 686 static void
 687 rename_block (bb, idom)
 688      int bb;
 689      int *idom;
 690 {
 691   basic_block b = BASIC_BLOCK (bb);
 692   edge e;
 693   rtx insn, next, last;
 694   struct rename_set_data *set_data = NULL;
 695   int c;
 696
 697   /* Step One: Walk the basic block, adding new names for sets and
 698      replacing uses.  */
 699
 700   next = b->head;
 701   last = b->end;
 702   do
 703     {
 704       insn = next;
 705       if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
 706         {
 707           struct rename_context context;
 708           context.set_data = set_data;
 709           context.current_insn = insn;
 710
 711           for_each_rtx (&PATTERN (insn), rename_insn_1, &context);
 712           for_each_rtx (&REG_NOTES (insn), rename_insn_1, &context);
 713
 714           new_registers_for_updates (context.set_data, set_data, insn);
 715           set_data = context.set_data;
 716         }
 717
 718       next = NEXT_INSN (insn);
 719     }
 720   while (insn != last);
 721
 722   /* Step Two: Update the phi nodes of this block's successors.  */
 723
 724   for (e = b->succ; e; e = e->succ_next)
 725     {
 726       if (e->dest == EXIT_BLOCK_PTR)
 727         continue;
 728
 729       insn = e->dest->head;
 730       if (GET_CODE (insn) == CODE_LABEL)
 731         insn = NEXT_INSN (insn);
 732
 733       while (PHI_NODE_P (insn))
 734         {
 735           rtx phi = PATTERN (insn);
 736           unsigned int regno;
 737           rtx reg;
 738
 739           /* Find out which of our outgoing registers this node is
 740              indended to replace.  Note that if this not the first PHI
 741              node to have been created for this register, we have to
 742              jump through rename links to figure out which register
 743              we're talking about.  This can easily be recognized by
 744              noting that the regno is new to this pass.  */
 745           regno = REGNO (SET_DEST (phi));
 746           if (regno >= ssa_max_reg_num)
 747             regno = REGNO (VARRAY_RTX (ssa_rename_from, regno));
 748           reg = ssa_rename_to[regno - FIRST_PSEUDO_REGISTER];
 749
 750           /* It is possible for the variable to be uninitialized on
 751              edges in.  Reduce the arity of the PHI so that we don't
 752              consider those edges.  */
 753           if (reg == NULL || reg == RENAME_NO_RTX)
 754             {
 755               if (! remove_phi_alternative (phi, bb))
 756                 abort ();
 757             }
 758           else
 759             {
 760               /* When we created the PHI nodes, we did not know what mode
 761              the register should be.  Now that we've found an original,
 762              we can fill that in.  */
 763               if (GET_MODE (SET_DEST (phi)) == VOIDmode)
 764                 PUT_MODE (SET_DEST (phi), GET_MODE (reg));
 765               else if (GET_MODE (SET_DEST (phi)) != GET_MODE (reg))
 766                 abort();
 767
 768               *phi_alternative (phi, bb) = reg;
 769               /* ??? Mark for a new ssa_uses entry.  */
 770             }
 771
 772           insn = NEXT_INSN (insn);
 773         }
 774     }
 775
 776   /* Step Three: Do the same to the children of this block in
 777      dominator order.  */
 778
 779   for (c = 0; c < n_basic_blocks; ++c)
 780     if (idom[c] == bb)
 781       rename_block (c, idom);
 782
 783   /* Step Four: Update the sets to refer to their new register.  */
 784
 785   while (set_data)
 786     {
 787       struct rename_set_data *next;
 788       rtx old_reg = *set_data->reg_loc;
 789
 790       /* If the set is of a subreg only, copy the entire reg first so
 791          that unmodified bits are preserved.  Of course, we don't
 792          strictly have SSA any more, but that's the best we can do
 793          without a lot of hard work.  */
 794
 795       if (GET_CODE (set_data->set_dest) == SUBREG)
 796         {
 797           if (old_reg != set_data->new_reg)
 798             {
 799               rtx copy = gen_rtx_SET (GET_MODE (old_reg),
 800                                       set_data->new_reg, old_reg);
 801               emit_insn_before (copy, set_data->set_insn);
 802             }
 803         }
 804
 805       *set_data->reg_loc = set_data->new_reg;
 806       ssa_rename_to[REGNO (old_reg)-FIRST_PSEUDO_REGISTER]
 807         = set_data->prev_reg;
 808
 809       next = set_data->next;
 810       free (set_data);
 811       set_data = next;
 812     }
 813 }
 814
 815 static void
 816 rename_registers (nregs, idom)
 817      int nregs;
 818      int *idom;
 819 {
 820   VARRAY_RTX_INIT (ssa_definition, nregs * 3, "ssa_definition");
 821   VARRAY_RTX_INIT (ssa_uses, nregs * 3, "ssa_uses");
 822   VARRAY_RTX_INIT (ssa_rename_from, nregs * 3, "ssa_rename_from");
 823
 824   ssa_rename_to = (rtx *) alloca (nregs * sizeof(rtx));
 825   bzero ((char *) ssa_rename_to, nregs * sizeof(rtx));
 826
 827   rename_block (0, idom);
 828
 829   /* ??? Update basic_block_live_at_start, and other flow info
 830      as needed.  */
 831
 832   ssa_rename_to = NULL;
 833 }
 834
 835
 836 /* The main entry point for moving to SSA.  */
 837
 838 void
 839 convert_to_ssa()
 840 {
 841   /* Element I is the set of blocks that set register I.  */
 842   sbitmap *evals;
 843
 844   /* Dominator bitmaps.  */
 845   sbitmap *dominators;
 846   sbitmap *dfs;
 847   sbitmap *idfs;
 848
 849   /* Element I is the immediate dominator of block I.  */
 850   int *idom;
 851
 852   int nregs;
 853
 854   /* Don't do it twice.  */
 855   if (in_ssa_form)
 856     abort ();
 857
 858   /* Don't eliminate dead code here.  The CFG we computed above must
 859      remain unchanged until we are finished emerging from SSA form --
 860      the phi node representation depends on it.  */
 861   life_analysis (get_insns (), max_reg_num (), NULL, 0);
 862
 863   /* Compute dominators.  */
 864   dominators = sbitmap_vector_alloc (n_basic_blocks, n_basic_blocks);
 865   compute_flow_dominators (dominators, NULL);
 866
 867   idom = (int *) alloca (n_basic_blocks * sizeof (int));
 868   memset ((void *)idom, -1, (size_t)n_basic_blocks * sizeof (int));
 869   simplify_to_immediate_dominators (idom, dominators);
 870
 871   sbitmap_vector_free (dominators);
 872
 873   if (rtl_dump_file)
 874     {
 875       int i;
 876       fputs (";; Immediate Dominators:\n", rtl_dump_file);
 877       for (i = 0; i < n_basic_blocks; ++i)
 878         fprintf (rtl_dump_file, ";\t%3d = %3d\n", i, idom[i]);
 879       fflush (rtl_dump_file);
 880     }
 881
 882   /* Compute dominance frontiers.  */
 883
 884   dfs = sbitmap_vector_alloc (n_basic_blocks, n_basic_blocks);
 885   compute_dominance_frontiers (dfs, idom);
 886
 887   if (rtl_dump_file)
 888     {
 889       dump_sbitmap_vector (rtl_dump_file, ";; Dominance Frontiers:",
 890                            "; Basic Block", dfs, n_basic_blocks);
 891       fflush (rtl_dump_file);
 892     }
 893
 894   /* Compute register evaluations.  */
 895
 896   ssa_max_reg_num = max_reg_num();
 897   nregs = ssa_max_reg_num - FIRST_PSEUDO_REGISTER;
 898   evals = sbitmap_vector_alloc (nregs, n_basic_blocks);
 899   find_evaluations (evals, nregs);
 900
 901   /* Compute the iterated dominance frontier for each register.  */
 902
 903   idfs = sbitmap_vector_alloc (nregs, n_basic_blocks);
 904   compute_iterated_dominance_frontiers (idfs, dfs, evals, nregs);
 905
 906   if (rtl_dump_file)
 907     {
 908       dump_sbitmap_vector (rtl_dump_file, ";; Iterated Dominance Frontiers:",
 909                            "; Register-FIRST_PSEUDO_REGISTER", idfs, nregs);
 910       fflush (rtl_dump_file);
 911     }
 912
 913   /* Insert the phi nodes.  */
 914
 915   insert_phi_nodes (idfs, evals, nregs);
 916
 917   /* Rename the registers to satisfy SSA.  */
 918
 919   rename_registers (nregs, idom);
 920
 921   /* All done!  Clean up and go home.  */
 922
 923   sbitmap_vector_free (dfs);
 924   sbitmap_vector_free (evals);
 925   sbitmap_vector_free (idfs);
 926   in_ssa_form = 1;
 927
 928   reg_scan (get_insns (), max_reg_num (), 1);
 929 }
 930
 931
 932 /* REG is the representative temporary of its partition.  Add it to the
 933    set of nodes to be processed, if it hasn't been already.  Return the
 934    index of this register in the node set.  */
 935
 936 static inline int
 937 ephi_add_node (reg, nodes, n_nodes)
 938      rtx reg, *nodes;
 939      int *n_nodes;
 940 {
 941   int i;
 942   for (i = *n_nodes - 1; i >= 0; --i)
 943     if (REGNO (reg) == REGNO (nodes[i]))
 944       return i;
 945
 946   nodes[i = (*n_nodes)++] = reg;
 947   return i;
 948 }
 949
 950 /* Part one of the topological sort.  This is a forward (downward) search
 951    through the graph collecting a stack of nodes to process.  Assuming no
 952    cycles, the nodes at top of the stack when we are finished will have
 953    no other dependancies.  */
 954
 955 static int *
 956 ephi_forward (t, visited, succ, tstack)
 957      int t;
 958      sbitmap visited;
 959      sbitmap *succ;
 960      int *tstack;
 961 {
 962   int s;
 963
 964   SET_BIT (visited, t);
 965
 966   EXECUTE_IF_SET_IN_SBITMAP (succ[t], 0, s,
 967     {
 968       if (! TEST_BIT (visited, s))
 969         tstack = ephi_forward (s, visited, succ, tstack);
 970     });
 971
 972   *tstack++ = t;
 973   return tstack;
 974 }
 975
 976 /* Part two of the topological sort.  The is a backward search through
 977    a cycle in the graph, copying the data forward as we go.  */
 978
 979 static void
 980 ephi_backward (t, visited, pred, nodes)
 981      int t;
 982      sbitmap visited, *pred;
 983      rtx *nodes;
 984 {
 985   int p;
 986
 987   SET_BIT (visited, t);
 988
 989   EXECUTE_IF_SET_IN_SBITMAP (pred[t], 0, p,
 990     {
 991       if (! TEST_BIT (visited, p))
 992         {
 993           ephi_backward (p, visited, pred, nodes);
 994           emit_move_insn (nodes[p], nodes[t]);
 995         }
 996     });
 997 }
 998
 999 /* Part two of the topological sort.  Create the copy for a register
1000    and any cycle of which it is a member.  */
1001
1002 static void
1003 ephi_create (t, visited, pred, succ, nodes)
1004      int t;
1005      sbitmap visited, *pred, *succ;
1006      rtx *nodes;
1007 {
1008   rtx reg_u = NULL_RTX;
1009   int unvisited_predecessors = 0;
1010   int p;
1011
1012   /* Iterate through the predecessor list looking for unvisited nodes.
1013      If there are any, we have a cycle, and must deal with that.  At
1014      the same time, look for a visited predecessor.  If there is one,
1015      we won't need to create a temporary.  */
1016
1017   EXECUTE_IF_SET_IN_SBITMAP (pred[t], 0, p,
1018     {
1019       if (! TEST_BIT (visited, p))
1020         unvisited_predecessors = 1;
1021       else if (!reg_u)
1022         reg_u = nodes[p];
1023     });
1024
1025   if (unvisited_predecessors)
1026     {
1027       /* We found a cycle.  Copy out one element of the ring (if necessary),
1028          then traverse the ring copying as we go.  */
1029
1030       if (!reg_u)
1031         {
1032           reg_u = gen_reg_rtx (GET_MODE (nodes[t]));
1033           emit_move_insn (reg_u, nodes[t]);
1034         }
1035
1036       EXECUTE_IF_SET_IN_SBITMAP (pred[t], 0, p,
1037         {
1038           if (! TEST_BIT (visited, p))
1039             {
1040               ephi_backward (p, visited, pred, nodes);
1041               emit_move_insn (nodes[p], reg_u);
1042             }
1043         });
1044     }
1045   else
1046     {
1047       /* No cycle.  Just copy the value from a successor.  */
1048
1049       int s;
1050       EXECUTE_IF_SET_IN_SBITMAP (succ[t], 0, s,
1051         {
1052           SET_BIT (visited, t);
1053           emit_move_insn (nodes[t], nodes[s]);
1054           return;
1055         });
1056     }
1057 }
1058
1059 /* Convert the edge to normal form.  */
1060
1061 static void
1062 eliminate_phi (e, reg_partition)
1063      edge e;
1064      partition reg_partition;
1065 {
1066   int n_nodes;
1067   sbitmap *pred, *succ;
1068   sbitmap visited;
1069   rtx *nodes;
1070   int *stack, *tstack;
1071   rtx insn;
1072   int i;
1073
1074   /* Collect an upper bound on the number of registers needing processing.  */
1075
1076   insn = e->dest->head;
1077   if (GET_CODE (insn) == CODE_LABEL)
1078     insn = next_nonnote_insn (insn);
1079
1080   n_nodes = 0;
1081   while (PHI_NODE_P (insn))
1082     {
1083       insn = next_nonnote_insn (insn);
1084       n_nodes += 2;
1085     }
1086
1087   if (n_nodes == 0)
1088     return;
1089
1090   /* Build the auxilliary graph R(B).
1091
1092      The nodes of the graph are the members of the register partition
1093      present in Phi(B).  There is an edge from FIND(T0)->FIND(T1) for
1094      each T0 = PHI(...,T1,...), where T1 is for the edge from block C.  */
1095
1096   nodes = (rtx *) alloca (n_nodes * sizeof(rtx));
1097   pred = sbitmap_vector_alloc (n_nodes, n_nodes);
1098   succ = sbitmap_vector_alloc (n_nodes, n_nodes);
1099   sbitmap_vector_zero (pred, n_nodes);
1100   sbitmap_vector_zero (succ, n_nodes);
1101
1102   insn = e->dest->head;
1103   if (GET_CODE (insn) == CODE_LABEL)
1104     insn = next_nonnote_insn (insn);
1105
1106   n_nodes = 0;
1107   for (; PHI_NODE_P (insn); insn = next_nonnote_insn (insn))
1108     {
1109       rtx* preg = phi_alternative (PATTERN (insn), e->src->index);
1110       rtx tgt = SET_DEST (PATTERN (insn));
1111       rtx reg;
1112
1113       /* There may be no phi alternative corresponding to this edge.
1114          This indicates that the phi variable is undefined along this
1115          edge.  */
1116       if (preg == NULL)
1117         continue;
1118       reg = *preg;
1119
1120       if (GET_CODE (reg) != REG || GET_CODE (tgt) != REG)
1121         abort();
1122
1123       reg = regno_reg_rtx[partition_find (reg_partition, REGNO (reg))];
1124       tgt = regno_reg_rtx[partition_find (reg_partition, REGNO (tgt))];
1125       /* If the two registers are already in the same partition,
1126          nothing will need to be done.  */
1127       if (reg != tgt)
1128         {
1129           int ireg, itgt;
1130
1131           ireg = ephi_add_node (reg, nodes, &n_nodes);
1132           itgt = ephi_add_node (tgt, nodes, &n_nodes);
1133
1134           SET_BIT (pred[ireg], itgt);
1135           SET_BIT (succ[itgt], ireg);
1136         }
1137     }
1138
1139   if (n_nodes == 0)
1140     goto out;
1141
1142   /* Begin a topological sort of the graph.  */
1143
1144   visited = sbitmap_alloc (n_nodes);
1145   sbitmap_zero (visited);
1146
1147   tstack = stack = (int *) alloca (n_nodes * sizeof (int));
1148
1149   for (i = 0; i < n_nodes; ++i)
1150     if (! TEST_BIT (visited, i))
1151       tstack = ephi_forward (i, visited, succ, tstack);
1152
1153   sbitmap_zero (visited);
1154
1155   /* As we find a solution to the tsort, collect the implementation
1156      insns in a sequence.  */
1157   start_sequence ();
1158
1159   while (tstack != stack)
1160     {
1161       i = *--tstack;
1162       if (! TEST_BIT (visited, i))
1163         ephi_create (i, visited, pred, succ, nodes);
1164     }
1165
1166   insn = gen_sequence ();
1167   end_sequence ();
1168   insert_insn_on_edge (insn, e);
1169   if (rtl_dump_file)
1170     fprintf (rtl_dump_file, "Emitting copy on edge (%d,%d)\n",
1171              e->src->index, e->dest->index);
1172
1173   sbitmap_free (visited);
1174 out:
1175   sbitmap_vector_free (pred);
1176   sbitmap_vector_free (succ);
1177 }
1178
1179
1180 /* For basic block B, consider all phi insns which provide an
1181    alternative corresponding to an incoming abnormal critical edge.
1182    Place the phi alternative corresponding to that abnormal critical
1183    edge in the same register class as the destination of the set.
1184
1185    From Morgan, p. 178:
1186
1187      For each abnormal critical edge (C, B),
1188      if T0 = phi (T1, ..., Ti, ..., Tm) is a phi node in B,
1189      and C is the ith predecessor of B,
1190      then T0 and Ti must be equivalent.
1191
1192    Return non-zero iff any such cases were found for which the two
1193    regs were not already in the same class.  */
1194
1195 static int
1196 make_regs_equivalent_over_bad_edges (bb, reg_partition)
1197      int bb;
1198      partition reg_partition;
1199 {
1200   int changed = 0;
1201   basic_block b = BASIC_BLOCK (bb);
1202   rtx phi = b->head;
1203
1204   /* Advance to the first phi node.  */
1205   if (GET_CODE (phi) == CODE_LABEL)
1206     phi = next_nonnote_insn (phi);
1207
1208   /* Scan all the phi nodes.  */
1209   for (;
1210        PHI_NODE_P (phi);
1211        phi = next_nonnote_insn (phi))
1212     {
1213       edge e;
1214       int tgt_regno;
1215       rtx set = PATTERN (phi);
1216       rtx tgt = SET_DEST (set);
1217
1218       /* The set target is expected to be a pseudo.  */
1219       if (GET_CODE (tgt) != REG
1220           || REGNO (tgt) < FIRST_PSEUDO_REGISTER)
1221         abort ();
1222       tgt_regno = REGNO (tgt);
1223
1224       /* Scan incoming abnormal critical edges.  */
1225       for (e = b->pred; e; e = e->pred_next)
1226         if (e->flags & (EDGE_ABNORMAL | EDGE_CRITICAL))
1227           {
1228             rtx *alt = phi_alternative (set, e->src->index);
1229             int alt_regno;
1230
1231             /* If there is no alternative corresponding to this edge,
1232                the value is undefined along the edge, so just go on.  */
1233             if (alt == 0)
1234               continue;
1235
1236             /* The phi alternative is expected to be a pseudo.  */
1237             if (GET_CODE (*alt) != REG
1238                 || REGNO (*alt) < FIRST_PSEUDO_REGISTER)
1239               abort ();
1240             alt_regno = REGNO (*alt);
1241
1242             /* If the set destination and the phi alternative aren't
1243                already in the same class...  */
1244             if (partition_find (reg_partition, tgt_regno)
1245                 != partition_find (reg_partition, alt_regno))
1246               {
1247                 /* ... make them such.  */
1248                 partition_union (reg_partition,
1249                                  tgt_regno, alt_regno);
1250                 ++changed;
1251               }
1252           }
1253     }
1254
1255   return changed;
1256 }
1257
1258
1259 /* Consider phi insns in basic block BB pairwise.  If the set target
1260    of both isns are equivalent pseudos, make the corresponding phi
1261    alternatives in each phi corresponding equivalent.
1262
1263    Return nonzero if any new register classes were unioned.  */
1264
1265 static int
1266 make_equivalent_phi_alternatives_equivalent (bb, reg_partition)
1267      int bb;
1268      partition reg_partition;
1269 {
1270   int changed = 0;
1271   rtx phi = BLOCK_HEAD (bb);
1272   basic_block b = BASIC_BLOCK (bb);
1273
1274   /* Advance to the first phi node.  */
1275   if (GET_CODE (phi) == CODE_LABEL)
1276     phi = next_nonnote_insn (phi);
1277
1278   /* Scan all the phi nodes.  */
1279   for (;
1280        PHI_NODE_P (phi);
1281        phi = next_nonnote_insn (phi))
1282     {
1283       rtx set = PATTERN (phi);
1284       /* The regno of the destination of the set.  */
1285       int tgt_regno = REGNO (SET_DEST (PATTERN (phi)));
1286
1287       rtx phi2 = next_nonnote_insn (phi);
1288
1289       /* Scan all phi nodes following this one.  */
1290       for (;
1291            PHI_NODE_P (phi2);
1292            phi2 = next_nonnote_insn (phi2))
1293         {
1294           rtx set2 = PATTERN (phi2);
1295           /* The regno of the destination of the set.  */
1296           int tgt2_regno = REGNO (SET_DEST (set2));
1297
1298           /* Are the set destinations equivalent regs?  */
1299           if (partition_find (reg_partition, tgt_regno) ==
1300               partition_find (reg_partition, tgt2_regno))
1301             {
1302               edge e;
1303               /* Scan over edges.  */
1304               for (e = b->pred; e; e = e->pred_next)
1305                 {
1306                   int pred_block = e->src->index;
1307                   /* Identify the phi altnernatives from both phi
1308                      nodes corresponding to this edge.  */
1309                   rtx *alt = phi_alternative (set, pred_block);
1310                   rtx *alt2 = phi_alternative (set2, pred_block);
1311
1312                   /* If one of the phi nodes doesn't have a
1313                      corresponding alternative, just skip it.  */
1314                   if (alt == 0 || alt2 == 0)
1315                     continue;
1316
1317                   /* Both alternatives should be pseudos.  */
1318                   if (GET_CODE (*alt) != REG
1319                       || REGNO (*alt) < FIRST_PSEUDO_REGISTER)
1320                     abort ();
1321                   if (GET_CODE (*alt2) != REG
1322                       || REGNO (*alt2) < FIRST_PSEUDO_REGISTER)
1323                     abort ();
1324
1325                   /* If the altneratives aren't already in the same
1326                      class ... */
1327                   if (partition_find (reg_partition, REGNO (*alt))
1328                       != partition_find (reg_partition, REGNO (*alt2)))
1329                     {
1330                       /* ... make them so.  */
1331                       partition_union (reg_partition,
1332                                        REGNO (*alt), REGNO (*alt2));
1333                       ++changed;
1334                     }
1335                 }
1336             }
1337         }
1338     }
1339
1340   return changed;
1341 }
1342
1343 /* Compute a conservative partition of outstanding pseudo registers.
1344    See Morgan 7.3.1.  */
1345
1346 static partition
1347 compute_conservative_reg_partition ()
1348 {
1349   int bb;
1350   int changed = 0;
1351
1352   /* We don't actually work with hard registers, but it's easier to
1353      carry them around anyway rather than constantly doing register
1354      number arithmetic.  */
1355   partition p =
1356     partition_new (ssa_definition->num_elements + FIRST_PSEUDO_REGISTER);
1357
1358   /* The first priority is to make sure registers that might have to
1359      be copied on abnormal critical edges are placed in the same
1360      partition.  This saves us from having to split abnormal critical
1361      edges.  */
1362   for (bb = n_basic_blocks; --bb >= 0; )
1363     changed += make_regs_equivalent_over_bad_edges (bb, p);
1364
1365   /* Now we have to insure that corresponding arguments of phi nodes
1366      assigning to corresponding regs are equivalent.  Iterate until
1367      nothing changes.  */
1368   while (changed > 0)
1369     {
1370       changed = 0;
1371       for (bb = n_basic_blocks; --bb >= 0; )
1372         changed += make_equivalent_phi_alternatives_equivalent (bb, p);
1373     }
1374
1375   return p;
1376 }
1377
1378 /* The following functions compute a register partition that attempts
1379    to eliminate as many reg copies and phi node copies as possible by
1380    coalescing registers.   This is the strategy:
1381
1382     1. As in the conservative case, the top priority is to coalesce
1383        registers that otherwise would cause copies to be placed on
1384        abnormal critical edges (which isn't possible).
1385
1386     2. Figure out which regs are involved (in the LHS or RHS) of
1387        copies and phi nodes.  Compute conflicts among these regs.
1388
1389     3. Walk around the instruction stream, placing two regs in the
1390        same class of the partition if one appears on the LHS and the
1391        other on the RHS of a copy or phi node and the two regs don't
1392        conflict.  The conflict information of course needs to be
1393        updated.
1394
1395     4. If anything has changed, there may be new opportunities to
1396        coalesce regs, so go back to 2.
1397 */
1398
1399 /* If REG1 and REG2 don't conflict in CONFLICTS, place them in the
1400    same class of partition P, if they aren't already.  Update
1401    CONFLICTS appropriately.
1402
1403    Returns one if REG1 and REG2 were placed in the same class but were
1404    not previously; zero otherwise.
1405
1406    See Morgan figure 11.15.  */
1407
1408 static int
1409 coalesce_if_unconflicting (p, conflicts, reg1, reg2)
1410      partition p;
1411      conflict_graph conflicts;
1412      int reg1;
1413      int reg2;
1414 {
1415   int reg;
1416
1417   /* Don't mess with hard regs.  */
1418   if (reg1 < FIRST_PSEUDO_REGISTER || reg2 < FIRST_PSEUDO_REGISTER)
1419     return 0;
1420
1421   /* Find the canonical regs for the classes containing REG1 and
1422      REG2.  */
1423   reg1 = partition_find (p, reg1);
1424   reg2 = partition_find (p, reg2);
1425
1426   /* If they're already in the same class, there's nothing to do.  */
1427   if (reg1 == reg2)
1428     return 0;
1429
1430   /* If the regs conflict, our hands are tied.  */
1431   if (conflict_graph_conflict_p (conflicts, reg1, reg2))
1432     return 0;
1433
1434   /* We're good to go.  Put the regs in the same partition.  */
1435   partition_union (p, reg1, reg2);
1436
1437   /* Find the new canonical reg for the merged class.  */
1438   reg = partition_find (p, reg1);
1439
1440   /* Merge conflicts from the two previous classes.  */
1441   conflict_graph_merge_regs (conflicts, reg, reg1);
1442   conflict_graph_merge_regs (conflicts, reg, reg2);
1443
1444   return 1;
1445 }
1446
1447 /* For each register copy insn in basic block BB, place the LHS and
1448    RHS regs in the same class in partition P if they do not conflict
1449    according to CONFLICTS.
1450
1451    Returns the number of changes that were made to P.
1452
1453    See Morgan figure 11.14.  */
1454
1455 static int
1456 coalesce_regs_in_copies (bb, p, conflicts)
1457      int bb;
1458      partition p;
1459      conflict_graph conflicts;
1460 {
1461   int changed = 0;
1462   rtx insn;
1463   rtx end = BLOCK_END (bb);
1464
1465   /* Scan the instruction stream of the block.  */
1466   for (insn = BLOCK_HEAD (bb); insn != end; insn = NEXT_INSN (insn))
1467     {
1468       rtx pattern;
1469       rtx src;
1470       rtx dest;
1471
1472       /* If this isn't a set insn, go to the next insn.  */
1473       if (GET_CODE (insn) != INSN)
1474         continue;
1475       pattern = PATTERN (insn);
1476       if (GET_CODE (pattern) != SET)
1477         continue;
1478
1479       src = SET_SRC (pattern);
1480       dest = SET_DEST (pattern);
1481
1482       /* If src or dest are subregs, find the underlying reg.  */
1483       while (GET_CODE (src) == SUBREG
1484              && SUBREG_WORD (src) != 0)
1485         src = SUBREG_REG (src);
1486       while (GET_CODE (dest) == SUBREG
1487              && SUBREG_WORD (dest) != 0)
1488         dest = SUBREG_REG (dest);
1489
1490       /* We're only looking for copies.  */
1491       if (GET_CODE (src) != REG || GET_CODE (dest) != REG)
1492         continue;
1493
1494       /* Coalesce only if the reg modes are the same.  As long as
1495          each reg's rtx is unique, it can have only one mode, so two
1496          pseudos of different modes can't be coalesced into one.
1497
1498          FIXME: We can probably get around this by inserting SUBREGs
1499          where appropriate, but for now we don't bother.  */
1500       if (GET_MODE (src) != GET_MODE (dest))
1501         continue;
1502
1503       /* Found a copy; see if we can use the same reg for both the
1504          source and destination (and thus eliminate the copy,
1505          ultimately).  */
1506       changed += coalesce_if_unconflicting (p, conflicts,
1507                                             REGNO (src), REGNO (dest));
1508     }
1509
1510   return changed;
1511 }
1512
1513
1514 struct phi_coalesce_context
1515 {
1516   partition p;
1517   conflict_graph conflicts;
1518   int changed;
1519 };
1520
1521 /* Callback function for for_each_successor_phi.  If the set
1522    destination and the phi alternative regs do not conflict, place
1523    them in the same paritition class.  DATA is a pointer to a
1524    phi_coalesce_context struct.  */
1525
1526 static int
1527 coalesce_reg_in_phi (insn, dest_regno, src_regno, data)
1528      rtx insn ATTRIBUTE_UNUSED;
1529      int dest_regno;
1530      int src_regno;
1531      void *data;
1532 {
1533   struct phi_coalesce_context *context =
1534     (struct phi_coalesce_context *) data;
1535
1536   /* Attempt to use the same reg, if they don't conflict.  */
1537   context->changed
1538     += coalesce_if_unconflicting (context->p, context->conflicts,
1539                                   dest_regno, src_regno);
1540   return 0;
1541 }
1542
1543 /* For each alternative in a phi function corresponding to basic block
1544    BB (in phi nodes in successor block to BB), place the reg in the
1545    phi alternative and the reg to which the phi value is set into the
1546    same class in partition P, if allowed by CONFLICTS.
1547
1548    Return the number of changes that were made to P.
1549
1550    See Morgan figure 11.14.  */
1551
1552 static int
1553 coalesce_regs_in_successor_phi_nodes (bb, p, conflicts)
1554      int bb;
1555      partition p;
1556      conflict_graph conflicts;
1557 {
1558   struct phi_coalesce_context context;
1559   context.p = p;
1560   context.conflicts = conflicts;
1561   context.changed = 0;
1562
1563   for_each_successor_phi (bb, &coalesce_reg_in_phi, &context);
1564
1565   return context.changed;
1566 }
1567
1568 /* Compute and return a partition of pseudos.  Where possible,
1569    non-conflicting pseudos are placed in the same class.
1570
1571    The caller is responsible for deallocating the returned partition.  */
1572
1573 static partition
1574 compute_coalesced_reg_partition ()
1575 {
1576   int bb;
1577   int changed = 0;
1578
1579   /* We don't actually work with hard registers, but it's easier to
1580      carry them around anyway rather than constantly doing register
1581      number arithmetic.  */
1582   partition p =
1583     partition_new (ssa_definition->num_elements + FIRST_PSEUDO_REGISTER);
1584
1585   /* The first priority is to make sure registers that might have to
1586      be copied on abnormal critical edges are placed in the same
1587      partition.  This saves us from having to split abnormal critical
1588      edges (which can't be done).  */
1589   for (bb = n_basic_blocks; --bb >= 0; )
1590     make_regs_equivalent_over_bad_edges (bb, p);
1591
1592   do
1593     {
1594       regset_head phi_set;
1595       conflict_graph conflicts;
1596
1597       changed = 0;
1598
1599       /* Build the set of registers involved in phi nodes, either as
1600          arguments to the phi function or as the target of a set.  */
1601       INITIALIZE_REG_SET (phi_set);
1602       mark_phi_and_copy_regs (&phi_set);
1603
1604       /* Compute conflicts.  */
1605       conflicts = conflict_graph_compute (&phi_set, p);
1606
1607       /* FIXME: Better would be to process most frequently executed
1608          blocks first, so that most frequently executed copies would
1609          be more likely to be removed by register coalescing.  But any
1610          order will generate correct, if non-optimal, results.  */
1611       for (bb = n_basic_blocks; --bb >= 0; )
1612         {
1613           changed += coalesce_regs_in_copies (bb, p, conflicts);
1614           changed += coalesce_regs_in_successor_phi_nodes (bb, p, conflicts);
1615         }
1616
1617       conflict_graph_delete (conflicts);
1618     }
1619   while (changed > 0);
1620
1621   return p;
1622 }
1623
1624 /* Mark the regs in a phi node.  PTR is a phi expression or one of its
1625    components (a REG or a CONST_INT).  DATA is a reg set in which to
1626    set all regs.  Called from for_each_rtx.  */
1627
1628 static int
1629 mark_reg_in_phi (ptr, data)
1630      rtx *ptr;
1631      void *data;
1632 {
1633   rtx expr = *ptr;
1634   regset set = (regset) data;
1635
1636   switch (GET_CODE (expr))
1637     {
1638     case REG:
1639       SET_REGNO_REG_SET (set, REGNO (expr));
1640       /* Fall through.  */
1641     case CONST_INT:
1642     case PHI:
1643       return 0;
1644     default:
1645       abort ();
1646     }
1647 }
1648
1649 /* Mark in PHI_SET all pseudos that are used in a phi node -- either
1650    set from a phi expression, or used as an argument in one.  Also
1651    mark regs that are the source or target of a reg copy.  Uses
1652    ssa_definition.  */
1653
1654 static void
1655 mark_phi_and_copy_regs (phi_set)
1656      regset phi_set;
1657 {
1658   int reg;
1659
1660   /* Scan the definitions of all regs.  */
1661   for (reg = VARRAY_SIZE (ssa_definition);
1662        --reg >= FIRST_PSEUDO_REGISTER;
1663        )
1664     {
1665       rtx insn = VARRAY_RTX (ssa_definition, reg);
1666       rtx pattern;
1667       rtx src;
1668
1669       if (insn == NULL)
1670         continue;
1671       pattern = PATTERN (insn);
1672       /* Sometimes we get PARALLEL insns.  These aren't phi nodes or
1673          copies.  */
1674       if (GET_CODE (pattern) != SET)
1675         continue;
1676       src = SET_SRC (pattern);
1677
1678       if (GET_CODE (src) == REG)
1679         {
1680           /* It's a reg copy.  */
1681           SET_REGNO_REG_SET (phi_set, reg);
1682           SET_REGNO_REG_SET (phi_set, REGNO (src));
1683         }
1684       else if (GET_CODE (src) == PHI)
1685         {
1686           /* It's a phi node.  Mark the reg being set.  */
1687           SET_REGNO_REG_SET (phi_set, reg);
1688           /* Mark the regs used in the phi function.  */
1689           for_each_rtx (&src, mark_reg_in_phi, phi_set);
1690         }
1691       /* ... else nothing to do.  */
1692     }
1693 }
1694
1695 /* Rename regs in insn PTR that are equivalent.  DATA is the register
1696    partition which specifies equivalences.  */
1697
1698 static int
1699 rename_equivalent_regs_in_insn (ptr, data)
1700      rtx *ptr;
1701      void* data;
1702 {
1703   rtx x = *ptr;
1704   partition reg_partition = (partition) data;
1705
1706   if (x == NULL_RTX)
1707     return 0;
1708
1709   switch (GET_CODE (x))
1710     {
1711     case SET:
1712       {
1713         rtx *destp = &SET_DEST (x);
1714         rtx dest = SET_DEST (x);
1715
1716         /* Subregs at word 0 are interesting.  Subregs at word != 0 are
1717            presumed to be part of a contiguous multi-word set sequence.  */
1718         while (GET_CODE (dest) == SUBREG
1719                && SUBREG_WORD (dest) == 0)
1720           {
1721             destp = &SUBREG_REG (dest);
1722             dest = SUBREG_REG (dest);
1723           }
1724
1725         if (GET_CODE (dest) == REG
1726             && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
1727           {
1728             /* Got a pseudo; replace it.  */
1729             int regno = REGNO (dest);
1730             int new_regno = partition_find (reg_partition, regno);
1731             if (regno != new_regno)
1732               *destp = regno_reg_rtx[new_regno];
1733
1734             for_each_rtx (&SET_SRC (x),
1735                           rename_equivalent_regs_in_insn,
1736                           data);
1737             return -1;
1738           }
1739
1740         /* Otherwise, this was not an interesting destination.  Continue
1741            on, marking uses as normal.  */
1742         return 0;
1743       }
1744
1745     case REG:
1746       if (REGNO (x) >= FIRST_PSEUDO_REGISTER)
1747         {
1748           int regno = REGNO (x);
1749           int new_regno = partition_find (reg_partition, regno);
1750           if (regno != new_regno)
1751             {
1752               rtx new_reg = regno_reg_rtx[new_regno];
1753               if (GET_MODE (x) != GET_MODE (new_reg))
1754                 abort ();
1755               *ptr = new_reg;
1756             }
1757         }
1758       return -1;
1759
1760     case PHI:
1761       /* No need to rename the phi nodes.  We'll check equivalence
1762          when inserting copies.  */
1763       return -1;
1764
1765     default:
1766       /* Anything else, continue traversing.  */
1767       return 0;
1768     }
1769 }
1770
1771 /* Rename regs that are equivalent in REG_PARTITION.  */
1772
1773 static void
1774 rename_equivalent_regs (reg_partition)
1775      partition reg_partition;
1776 {
1777   int bb;
1778
1779   for (bb = n_basic_blocks; --bb >= 0; )
1780     {
1781       basic_block b = BASIC_BLOCK (bb);
1782       rtx next = b->head;
1783       rtx last = b->end;
1784       rtx insn;
1785
1786       do
1787         {
1788           insn = next;
1789           if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
1790             {
1791               for_each_rtx (&PATTERN (insn),
1792                             rename_equivalent_regs_in_insn,
1793                             reg_partition);
1794               for_each_rtx (&REG_NOTES (insn),
1795                             rename_equivalent_regs_in_insn,
1796                             reg_partition);
1797             }
1798
1799           next = NEXT_INSN (insn);
1800         }
1801       while (insn != last);
1802     }
1803 }
1804
1805 /* The main entry point for moving from SSA.  */
1806
1807 void
1808 convert_from_ssa()
1809 {
1810   int bb;
1811   partition reg_partition;
1812   rtx insns = get_insns ();
1813
1814   /* We need up-to-date life information.  */
1815   life_analysis (insns, max_reg_num (), NULL, 0);
1816
1817   /* Figure out which regs in copies and phi nodes don't conflict and
1818      therefore can be coalesced.  */
1819   if (conservative_reg_partition)
1820     reg_partition = compute_conservative_reg_partition ();
1821   else
1822     reg_partition = compute_coalesced_reg_partition ();
1823
1824   rename_equivalent_regs (reg_partition);
1825
1826   /* Eliminate the PHI nodes.  */
1827   for (bb = n_basic_blocks; --bb >= 0; )
1828     {
1829       basic_block b = BASIC_BLOCK (bb);
1830       edge e;
1831
1832       for (e = b->pred; e; e = e->pred_next)
1833         if (e->src != ENTRY_BLOCK_PTR)
1834           eliminate_phi (e, reg_partition);
1835     }
1836
1837   partition_delete (reg_partition);
1838
1839   /* Actually delete the PHI nodes.  */
1840   for (bb = n_basic_blocks; --bb >= 0; )
1841     {
1842       rtx insn = BLOCK_HEAD (bb);
1843       int start = (GET_CODE (insn) != CODE_LABEL);
1844
1845       if (! start)
1846         insn = next_nonnote_insn (insn);
1847       while (PHI_NODE_P (insn))
1848         {
1849           /* If a phi node is the last insn in the block, there must
1850              have been nothing else.  Set the block end to the block
1851              head.  */
1852           if (insn == BLOCK_END (bb))
1853             BLOCK_END (bb) = BLOCK_HEAD (bb);
1854           insn = delete_insn (insn);
1855           if (GET_CODE (insn) == NOTE)
1856             insn = next_nonnote_insn (insn);
1857         }
1858       if (start)
1859         BLOCK_HEAD (bb) = insn;
1860     }
1861
1862   /* Commit all the copy nodes needed to convert out of SSA form.  */
1863   commit_edge_insertions ();
1864
1865   in_ssa_form = 0;
1866
1867   count_or_remove_death_notes (NULL, 1);
1868 }
1869
1870 /* Scan phi nodes in successors to BB.  For each such phi node that
1871    has a phi alternative value corresponding to BB, invoke FN.  FN
1872    is passed the entire phi node insn, the regno of the set
1873    destination, the regno of the phi argument corresponding to BB,
1874    and DATA.
1875
1876    If FN ever returns non-zero, stops immediately and returns this
1877    value.  Otherwise, returns zero.  */
1878
1879 int
1880 for_each_successor_phi (bb, fn, data)
1881      int bb;
1882      successor_phi_fn fn;
1883      void *data;
1884 {
1885   basic_block block;
1886   edge e;
1887
1888   if (bb == EXIT_BLOCK)
1889     return 0;
1890   else if (bb == ENTRY_BLOCK)
1891     block = ENTRY_BLOCK_PTR;
1892   else
1893     block = BASIC_BLOCK (bb);
1894
1895   /* Scan outgoing edges.  */
1896   for (e = block->succ; e != NULL; e = e->succ_next)
1897     {
1898       rtx insn;
1899
1900       basic_block successor = e->dest;
1901       if (successor->index == ENTRY_BLOCK
1902           || successor->index == EXIT_BLOCK)
1903         continue;
1904
1905       /* Advance to the first non-label insn of the successor block.  */
1906       insn = successor->head;
1907       while (insn != NULL
1908              && (GET_CODE (insn) == CODE_LABEL
1909                  || GET_CODE (insn) == NOTE))
1910         insn = NEXT_INSN (insn);
1911
1912       if (insn == NULL)
1913         continue;
1914
1915       /* Scan phi nodes in the successor.  */
1916       for ( ; PHI_NODE_P (insn); insn = NEXT_INSN (insn))
1917         {
1918           int result;
1919           rtx phi_set = PATTERN (insn);
1920           rtx *alternative = phi_alternative (phi_set, block->index);
1921           rtx phi_src;
1922
1923           /* This phi function may not have an alternative
1924              corresponding to the incoming edge, indicating the
1925              assigned variable is not defined along the edge.  */
1926           if (alternative == NULL)
1927             continue;
1928           phi_src = *alternative;
1929
1930           /* Invoke the callback.  */
1931           result = (*fn) (insn, REGNO (SET_DEST (phi_set)),
1932                           REGNO (phi_src), data);
1933
1934           /* Terminate if requested.  */
1935           if (result != 0)
1936             return result;
1937         }
1938     }
1939
1940   return 0;
1941 }