gcc/ssa.c

   1 /* Static Single Assignment conversion routines for the GNU compiler.
   2    Copyright (C) 2000 Free Software Foundation, Inc.
   3
   4 This file is part of GNU CC.
   5
   6 GNU CC is free software; you can redistribute it and/or modify it
   7 under the terms of the GNU General Public License as published by the
   8 Free Software Foundation; either version 2, or (at your option) any
   9 later version.
  10
  11 GNU CC is distributed in the hope that it will be useful, but WITHOUT
  12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GNU CC; see the file COPYING.  If not, write to the Free
  18 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  19 02111-1307, USA.  */
  20
  21 /* References:
  22
  23    Building an Optimizing Compiler
  24    Robert Morgan
  25    Butterworth-Heinemann, 1998
  26
  27    Static Single Assignment Construction
  28    Preston Briggs, Tim Harvey, Taylor Simpson
  29    Technical Report, Rice University, 1995
  30    ftp://ftp.cs.rice.edu/public/preston/optimizer/SSA.ps.gz
  31 */
  32
  33 #include "config.h"
  34 #include "system.h"
  35
  36 #include "rtl.h"
  37 #include "regs.h"
  38 #include "hard-reg-set.h"
  39 #include "flags.h"
  40 #include "function.h"
  41 #include "real.h"
  42 #include "insn-config.h"
  43 #include "recog.h"
  44 #include "basic-block.h"
  45 #include "output.h"
  46 #include "partition.h"
  47
  48
  49 /* TODO:
  50
  51    Handle subregs better, maybe.  For now, if a reg that's set in a
  52    subreg expression is duplicated going into SSA form, an extra copy
  53    is inserted first that copies the entire reg into the duplicate, so
  54    that the other bits are preserved.  This isn't strictly SSA, since
  55    at least part of the reg is assigned in more than one place (though
  56    they are adjacent).
  57
  58    ??? What to do about strict_low_part.  Probably I'll have to split
  59    them out of their current instructions first thing.
  60
  61    Actually the best solution may be to have a kind of "mid-level rtl"
  62    in which the RTL encodes exactly what we want, without exposing a
  63    lot of niggling processor details.  At some later point we lower
  64    the representation, calling back into optabs to finish any necessary
  65    expansion.  */
  66
  67
  68 /* If conservative_reg_partition is non-zero, use a conservative
  69    register partitioning algorithm (which leaves more regs after
  70    emerging from SSA) instead of the coalescing one.  This is being
  71    left in for a limited time only, as a debugging tool until the
  72    coalescing algorithm is validated.  */
  73 static int conservative_reg_partition;
  74
  75 /* This flag is set when the CFG is in SSA form.  */
  76 int in_ssa_form = 0;
  77
  78 /* Element I is the single instruction that sets register I+PSEUDO.  */
  79 varray_type ssa_definition;
  80
  81 /* Element I is an INSN_LIST of instructions that use register I+PSEUDO.  */
  82 varray_type ssa_uses;
  83
  84 /* Element I-PSEUDO is the normal register that originated the ssa
  85    register in question.  */
  86 varray_type ssa_rename_from;
  87
  88 /* The running target ssa register for a given normal register.  */
  89 static rtx *ssa_rename_to;
  90
  91 /* The number of registers that were live on entry to the SSA routines.  */
  92 static unsigned int ssa_max_reg_num;
  93
  94 /* Local function prototypes.  */
  95
  96 static inline rtx * phi_alternative
  97   PARAMS ((rtx, int));
  98
  99 static int remove_phi_alternative
 100   PARAMS ((rtx, int));
 101 static void simplify_to_immediate_dominators
 102   PARAMS ((int *idom, sbitmap *dominators));
 103 static void compute_dominance_frontiers_1
 104   PARAMS ((sbitmap *frontiers, int *idom, int bb, sbitmap done));
 105 static void compute_dominance_frontiers
 106   PARAMS ((sbitmap *frontiers, int *idom));
 107 static void find_evaluations_1
 108   PARAMS ((rtx dest, rtx set, void *data));
 109 static void find_evaluations
 110   PARAMS ((sbitmap *evals, int nregs));
 111 static void compute_iterated_dominance_frontiers
 112   PARAMS ((sbitmap *idfs, sbitmap *frontiers, sbitmap *evals, int nregs));
 113 static void insert_phi_node
 114   PARAMS ((int regno, int b));
 115 static void insert_phi_nodes
 116   PARAMS ((sbitmap *idfs, sbitmap *evals, int nregs));
 117 static int rename_insn_1
 118   PARAMS ((rtx *ptr, void *data));
 119 static void rename_block
 120   PARAMS ((int b, int *idom));
 121 static void rename_registers
 122   PARAMS ((int nregs, int *idom));
 123
 124 static inline int ephi_add_node
 125   PARAMS ((rtx reg, rtx *nodes, int *n_nodes));
 126 static int * ephi_forward
 127   PARAMS ((int t, sbitmap visited, sbitmap *succ, int *tstack));
 128 static void ephi_backward
 129   PARAMS ((int t, sbitmap visited, sbitmap *pred, rtx *nodes));
 130 static void ephi_create
 131   PARAMS ((int t, sbitmap visited, sbitmap *pred, sbitmap *succ, rtx *nodes));
 132 static void eliminate_phi
 133   PARAMS ((edge e, partition reg_partition));
 134 static int make_regs_equivalent_over_bad_edges
 135   PARAMS ((int bb, partition reg_partition));
 136
 137 /* These are used only in the conservative register partitioning
 138    algorithms.  */
 139 static int make_equivalent_phi_alternatives_equivalent
 140   PARAMS ((int bb, partition reg_partition));
 141 static partition compute_conservative_reg_partition
 142   PARAMS ((void));
 143 static int rename_equivalent_regs_in_insn
 144   PARAMS ((rtx *ptr, void *data));
 145
 146 /* These are used in the register coalescing algorithm.  */
 147 static int coalesce_if_unconflicting
 148   PARAMS ((partition p, conflict_graph conflicts, int reg1, int reg2));
 149 static int coalesce_regs_in_copies
 150   PARAMS ((basic_block bb, partition p, conflict_graph conflicts));
 151 static int coalesce_reg_in_phi
 152   PARAMS ((rtx, int dest_regno, int src_regno, void *data));
 153 static int coalesce_regs_in_successor_phi_nodes
 154   PARAMS ((basic_block bb, partition p, conflict_graph conflicts));
 155 static partition compute_coalesced_reg_partition
 156   PARAMS (());
 157 static int mark_reg_in_phi
 158   PARAMS ((rtx *ptr, void *data));
 159 static void mark_phi_and_copy_regs
 160   PARAMS ((regset phi_set));
 161
 162 static int rename_equivalent_regs_in_insn
 163   PARAMS ((rtx *ptr, void *data));
 164 static void rename_equivalent_regs
 165   PARAMS ((partition reg_partition));
 166
 167
 168 /* Given the SET of a PHI node, return the address of the alternative
 169    for predecessor block C.  */
 170
 171 static inline rtx *
 172 phi_alternative (set, c)
 173      rtx set;
 174      int c;
 175 {
 176   rtvec phi_vec = XVEC (SET_SRC (set), 0);
 177   int v;
 178
 179   for (v = GET_NUM_ELEM (phi_vec) - 2; v >= 0; v -= 2)
 180     if (INTVAL (RTVEC_ELT (phi_vec, v + 1)) == c)
 181       return &RTVEC_ELT (phi_vec, v);
 182
 183   return NULL;
 184 }
 185
 186 /* Given the SET of a phi node, remove the alternative for predecessor
 187    block C.  Return non-zero on success, or zero if no alternative is
 188    found for C.  */
 189
 190 static int
 191 remove_phi_alternative (set, c)
 192      rtx set;
 193      int c;
 194 {
 195   rtvec phi_vec = XVEC (SET_SRC (set), 0);
 196   int num_elem = GET_NUM_ELEM (phi_vec);
 197   int v;
 198
 199   for (v = num_elem - 2; v >= 0; v -= 2)
 200     if (INTVAL (RTVEC_ELT (phi_vec, v + 1)) == c)
 201       {
 202         if (v < num_elem - 2)
 203           {
 204             RTVEC_ELT (phi_vec, v) = RTVEC_ELT (phi_vec, num_elem - 2);
 205             RTVEC_ELT (phi_vec, v + 1) = RTVEC_ELT (phi_vec, num_elem - 1);
 206           }
 207         PUT_NUM_ELEM (phi_vec, num_elem - 2);
 208         return 1;
 209       }
 210
 211   return 0;
 212 }
 213
 214 /* Computing the Immediate Dominators:
 215
 216    Throughout, we don't actually want the full dominators set as
 217    calculated by flow, but rather the immediate dominators.
 218 */
 219
 220 static void
 221 simplify_to_immediate_dominators (idom, dominators)
 222      int *idom;
 223      sbitmap *dominators;
 224 {
 225   sbitmap *tmp;
 226   int b;
 227
 228   tmp = sbitmap_vector_alloc (n_basic_blocks, n_basic_blocks);
 229
 230   /* Begin with tmp(n) = dom(n) - { n }.  */
 231   for (b = n_basic_blocks; --b >= 0; )
 232     {
 233       sbitmap_copy (tmp[b], dominators[b]);
 234       RESET_BIT (tmp[b], b);
 235     }
 236
 237   /* Subtract out all of our dominator's dominators.  */
 238   for (b = n_basic_blocks; --b >= 0; )
 239     {
 240       sbitmap tmp_b = tmp[b];
 241       int s;
 242
 243       for (s = n_basic_blocks; --s >= 0; )
 244         if (TEST_BIT (tmp_b, s))
 245           sbitmap_difference (tmp_b, tmp_b, tmp[s]);
 246     }
 247
 248   /* Find the one bit set in the bitmap and put it in the output array.  */
 249   for (b = n_basic_blocks; --b >= 0; )
 250     {
 251       int t;
 252       EXECUTE_IF_SET_IN_SBITMAP (tmp[b], 0, t, { idom[b] = t; });
 253     }
 254
 255   sbitmap_vector_free (tmp);
 256 }
 257
 258
 259 /* For all registers, find all blocks in which they are set.
 260
 261    This is the transform of what would be local kill information that
 262    we ought to be getting from flow.  */
 263
 264 static sbitmap *fe_evals;
 265 static int fe_current_bb;
 266
 267 static void
 268 find_evaluations_1 (dest, set, data)
 269      rtx dest;
 270      rtx set ATTRIBUTE_UNUSED;
 271      void *data ATTRIBUTE_UNUSED;
 272 {
 273   if (GET_CODE (dest) == REG
 274       && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
 275     SET_BIT (fe_evals[REGNO (dest) - FIRST_PSEUDO_REGISTER], fe_current_bb);
 276 }
 277
 278 static void
 279 find_evaluations (evals, nregs)
 280      sbitmap *evals;
 281      int nregs;
 282 {
 283   int bb;
 284
 285   sbitmap_vector_zero (evals, nregs);
 286   fe_evals = evals;
 287
 288   for (bb = n_basic_blocks; --bb >= 0; )
 289     {
 290       rtx p, last;
 291
 292       fe_current_bb = bb;
 293       p = BLOCK_HEAD (bb);
 294       last = BLOCK_END (bb);
 295       while (1)
 296         {
 297           if (GET_RTX_CLASS (GET_CODE (p)) == 'i')
 298             note_stores (PATTERN (p), find_evaluations_1, NULL);
 299
 300           if (p == last)
 301             break;
 302           p = NEXT_INSN (p);
 303         }
 304     }
 305 }
 306
 307
 308 /* Computing the Dominance Frontier:
 309
 310    As decribed in Morgan, section 3.5, this may be done simply by
 311    walking the dominator tree bottom-up, computing the frontier for
 312    the children before the parent.  When considering a block B,
 313    there are two cases:
 314
 315    (1) A flow graph edge leaving B that does not lead to a child
 316    of B in the dominator tree must be a block that is either equal
 317    to B or not dominated by B.  Such blocks belong in the frontier
 318    of B.
 319
 320    (2) Consider a block X in the frontier of one of the children C
 321    of B.  If X is not equal to B and is not dominated by B, it
 322    is in the frontier of B.
 323 */
 324
 325 static void
 326 compute_dominance_frontiers_1 (frontiers, idom, bb, done)
 327      sbitmap *frontiers;
 328      int *idom;
 329      int bb;
 330      sbitmap done;
 331 {
 332   basic_block b = BASIC_BLOCK (bb);
 333   edge e;
 334   int c;
 335
 336   SET_BIT (done, bb);
 337   sbitmap_zero (frontiers[bb]);
 338
 339   /* Do the frontier of the children first.  Not all children in the
 340      dominator tree (blocks dominated by this one) are children in the
 341      CFG, so check all blocks.  */
 342   for (c = 0; c < n_basic_blocks; ++c)
 343     if (idom[c] == bb && ! TEST_BIT (done, c))
 344       compute_dominance_frontiers_1 (frontiers, idom, c, done);
 345
 346   /* Find blocks conforming to rule (1) above.  */
 347   for (e = b->succ; e; e = e->succ_next)
 348     {
 349       if (e->dest == EXIT_BLOCK_PTR)
 350         continue;
 351       if (idom[e->dest->index] != bb)
 352         SET_BIT (frontiers[bb], e->dest->index);
 353     }
 354
 355   /* Find blocks conforming to rule (2).  */
 356   for (c = 0; c < n_basic_blocks; ++c)
 357     if (idom[c] == bb)
 358       {
 359         int x;
 360         EXECUTE_IF_SET_IN_SBITMAP (frontiers[c], 0, x,
 361           {
 362             if (idom[x] != bb)
 363               SET_BIT (frontiers[bb], x);
 364           });
 365       }
 366 }
 367
 368 static void
 369 compute_dominance_frontiers (frontiers, idom)
 370      sbitmap *frontiers;
 371      int *idom;
 372 {
 373   sbitmap done = sbitmap_alloc (n_basic_blocks);
 374   sbitmap_zero (done);
 375
 376   compute_dominance_frontiers_1 (frontiers, idom, 0, done);
 377
 378   sbitmap_free (done);
 379 }
 380
 381
 382 /* Computing the Iterated Dominance Frontier:
 383
 384    This is the set of merge points for a given register.
 385
 386    This is not particularly intuitive.  See section 7.1 of Morgan, in
 387    particular figures 7.3 and 7.4 and the immediately surrounding text.
 388 */
 389
 390 static void
 391 compute_iterated_dominance_frontiers (idfs, frontiers, evals, nregs)
 392      sbitmap *idfs;
 393      sbitmap *frontiers;
 394      sbitmap *evals;
 395      int nregs;
 396 {
 397   sbitmap worklist;
 398   int reg, passes = 0;
 399
 400   worklist = sbitmap_alloc (n_basic_blocks);
 401
 402   for (reg = 0; reg < nregs; ++reg)
 403     {
 404       sbitmap idf = idfs[reg];
 405       int b, changed;
 406
 407       /* Start the iterative process by considering those blocks that
 408          evaluate REG.  We'll add their dominance frontiers to the
 409          IDF, and then consider the blocks we just added.  */
 410       sbitmap_copy (worklist, evals[reg]);
 411
 412       /* Morgan's algorithm is incorrect here.  Blocks that evaluate
 413          REG aren't necessarily in REG's IDF.  Start with an empty IDF.  */
 414       sbitmap_zero (idf);
 415
 416       /* Iterate until the worklist is empty.  */
 417       do
 418         {
 419           changed = 0;
 420           passes++;
 421           EXECUTE_IF_SET_IN_SBITMAP (worklist, 0, b,
 422             {
 423               RESET_BIT (worklist, b);
 424               /* For each block on the worklist, add to the IDF all
 425                  blocks on its dominance frontier that aren't already
 426                  on the IDF.  Every block that's added is also added
 427                  to the worklist.  */
 428               sbitmap_union_of_diff (worklist, worklist, frontiers[b], idf);
 429               sbitmap_a_or_b (idf, idf, frontiers[b]);
 430               changed = 1;
 431             });
 432         }
 433       while (changed);
 434     }
 435
 436   sbitmap_free (worklist);
 437
 438   if (rtl_dump_file)
 439     {
 440       fprintf(rtl_dump_file,
 441               "Iterated dominance frontier: %d passes on %d regs.\n",
 442               passes, nregs);
 443     }
 444 }
 445
 446
 447 /* Insert the phi nodes.  */
 448
 449 static void
 450 insert_phi_node (regno, bb)
 451      int regno, bb;
 452 {
 453   basic_block b = BASIC_BLOCK (bb);
 454   edge e;
 455   int npred, i;
 456   rtvec vec;
 457   rtx phi, reg;
 458
 459   /* Find out how many predecessors there are.  */
 460   for (e = b->pred, npred = 0; e; e = e->pred_next)
 461     if (e->src != ENTRY_BLOCK_PTR)
 462       npred++;
 463
 464   /* If this block has no "interesting" preds, then there is nothing to
 465      do.  Consider a block that only has the entry block as a pred.  */
 466   if (npred == 0)
 467     return;
 468
 469   /* This is the register to which the phi function will be assinged.  */
 470   reg = regno_reg_rtx[regno + FIRST_PSEUDO_REGISTER];
 471
 472   /* Construct the arguments to the PHI node.  The use of pc_rtx is just
 473      a placeholder; we'll insert the proper value in rename_registers.  */
 474   vec = rtvec_alloc (npred * 2);
 475   for (e = b->pred, i = 0; e ; e = e->pred_next, i += 2)
 476     if (e->src != ENTRY_BLOCK_PTR)
 477       {
 478         RTVEC_ELT (vec, i + 0) = pc_rtx;
 479         RTVEC_ELT (vec, i + 1) = GEN_INT (e->src->index);
 480       }
 481
 482   phi = gen_rtx_PHI (VOIDmode, vec);
 483   phi = gen_rtx_SET (VOIDmode, reg, phi);
 484
 485   if (GET_CODE (b->head) == CODE_LABEL)
 486     emit_insn_after (phi, b->head);
 487   else
 488     b->head = emit_insn_before (phi, b->head);
 489 }
 490
 491
 492 static void
 493 insert_phi_nodes (idfs, evals, nregs)
 494      sbitmap *idfs;
 495      sbitmap *evals ATTRIBUTE_UNUSED;
 496      int nregs;
 497 {
 498   int reg;
 499
 500   for (reg = 0; reg < nregs; ++reg)
 501     {
 502       int b;
 503       EXECUTE_IF_SET_IN_SBITMAP (idfs[reg], 0, b,
 504         {
 505           if (REGNO_REG_SET_P (BASIC_BLOCK (b)->global_live_at_start,
 506                                reg + FIRST_PSEUDO_REGISTER))
 507             insert_phi_node (reg, b);
 508         });
 509     }
 510 }
 511
 512 /* Rename the registers to conform to SSA.
 513
 514    This is essentially the algorithm presented in Figure 7.8 of Morgan,
 515    with a few changes to reduce pattern search time in favour of a bit
 516    more memory usage.  */
 517
 518
 519 /* One of these is created for each set.  It will live in a list local
 520    to its basic block for the duration of that block's processing.  */
 521 struct rename_set_data
 522 {
 523   struct rename_set_data *next;
 524   rtx *reg_loc;
 525   rtx set_dest;
 526   rtx new_reg;
 527   rtx prev_reg;
 528   rtx set_insn;
 529 };
 530
 531 /* This struct is used to pass information to callback functions while
 532    renaming registers.  */
 533 struct rename_context
 534 {
 535   struct rename_set_data *set_data;
 536   rtx current_insn;
 537 };
 538
 539 static void new_registers_for_updates
 540   PARAMS ((struct rename_set_data *set_data,
 541            struct rename_set_data *old_set_data, rtx insn));
 542
 543 /* This is part of a rather ugly hack to allow the pre-ssa regno to be
 544    reused.  If, during processing, a register has not yet been touched,
 545    ssa_rename_to[regno] will be NULL.  Now, in the course of pushing
 546    and popping values from ssa_rename_to, when we would ordinarily
 547    pop NULL back in, we pop RENAME_NO_RTX.  We treat this exactly the
 548    same as NULL, except that it signals that the original regno has
 549    already been reused.  */
 550 #define RENAME_NO_RTX  pc_rtx
 551
 552 /* Part one of the first step of rename_block, called through for_each_rtx.
 553    Mark pseudos that are set for later update.  Transform uses of pseudos.  */
 554
 555 static int
 556 rename_insn_1 (ptr, data)
 557      rtx *ptr;
 558      void *data;
 559 {
 560   rtx x = *ptr;
 561   struct rename_context *context = data;
 562   struct rename_set_data **set_datap = &(context->set_data);
 563
 564   if (x == NULL_RTX)
 565     return 0;
 566
 567   switch (GET_CODE (x))
 568     {
 569     case SET:
 570       {
 571         rtx *destp = &SET_DEST (x);
 572         rtx dest = SET_DEST (x);
 573
 574         /* Subregs at word 0 are interesting.  Subregs at word != 0 are
 575            presumed to be part of a contiguous multi-word set sequence.  */
 576         while (GET_CODE (dest) == SUBREG
 577                && SUBREG_WORD (dest) == 0)
 578           {
 579             destp = &SUBREG_REG (dest);
 580             dest = SUBREG_REG (dest);
 581           }
 582
 583         if (GET_CODE (dest) == REG
 584             && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
 585           {
 586             /* We found a genuine set of an interesting register.  Tag
 587                it so that we can create a new name for it after we finish
 588                processing this insn.  */
 589
 590             struct rename_set_data *r;
 591             r = (struct rename_set_data *) xmalloc (sizeof(*r));
 592
 593             r->reg_loc = destp;
 594             r->set_dest = SET_DEST (x);
 595             r->set_insn = context->current_insn;
 596             r->next = *set_datap;
 597             *set_datap = r;
 598
 599             /* Since we do not wish to (directly) traverse the
 600                SET_DEST, recurse through for_each_rtx for the SET_SRC
 601                and return.  */
 602             for_each_rtx (&SET_SRC (x), rename_insn_1, data);
 603             return -1;
 604           }
 605
 606         /* Otherwise, this was not an interesting destination.  Continue
 607            on, marking uses as normal.  */
 608         return 0;
 609       }
 610
 611     case REG:
 612       if (REGNO (x) >= FIRST_PSEUDO_REGISTER
 613           && REGNO (x) < ssa_max_reg_num)
 614         {
 615           rtx new_reg = ssa_rename_to[REGNO(x) - FIRST_PSEUDO_REGISTER];
 616
 617           if (new_reg != NULL_RTX && new_reg != RENAME_NO_RTX)
 618             {
 619               if (GET_MODE (x) != GET_MODE (new_reg))
 620                 abort ();
 621               *ptr = new_reg;
 622             }
 623           /* Else this is a use before a set.  Warn?  */
 624         }
 625       return -1;
 626
 627     case PHI:
 628       /* Never muck with the phi.  We do that elsewhere, special-like.  */
 629       return -1;
 630
 631     default:
 632       /* Anything else, continue traversing.  */
 633       return 0;
 634     }
 635 }
 636
 637 /* Second part of the first step of rename_block.  The portion of the list
 638    beginning at SET_DATA through OLD_SET_DATA contain the sets present in
 639    INSN.  Update data structures accordingly.  */
 640
 641 static void
 642 new_registers_for_updates (set_data, old_set_data, insn)
 643      struct rename_set_data *set_data, *old_set_data;
 644      rtx insn;
 645 {
 646   while (set_data != old_set_data)
 647     {
 648       int regno, new_regno;
 649       rtx old_reg, new_reg, prev_reg;
 650
 651       old_reg = *set_data->reg_loc;
 652       regno = REGNO (*set_data->reg_loc);
 653
 654       /* For the first set we come across, reuse the original regno.  */
 655       if (ssa_rename_to[regno - FIRST_PSEUDO_REGISTER] == NULL_RTX)
 656         {
 657           new_reg = old_reg;
 658           prev_reg = RENAME_NO_RTX;
 659         }
 660       else
 661         {
 662           prev_reg = ssa_rename_to[regno - FIRST_PSEUDO_REGISTER];
 663           new_reg = gen_reg_rtx (GET_MODE (old_reg));
 664         }
 665
 666       set_data->new_reg = new_reg;
 667       set_data->prev_reg = prev_reg;
 668       new_regno = REGNO (new_reg);
 669       ssa_rename_to[regno - FIRST_PSEUDO_REGISTER] = new_reg;
 670
 671       if (new_regno >= (int) ssa_definition->num_elements)
 672         {
 673           int new_limit = new_regno * 5 / 4;
 674           ssa_definition = VARRAY_GROW (ssa_definition, new_limit);
 675           ssa_uses = VARRAY_GROW (ssa_uses, new_limit);
 676           ssa_rename_from = VARRAY_GROW (ssa_rename_from, new_limit);
 677         }
 678
 679       VARRAY_RTX (ssa_definition, new_regno) = insn;
 680       VARRAY_RTX (ssa_rename_from, new_regno) = old_reg;
 681
 682       set_data = set_data->next;
 683     }
 684 }
 685
 686 static void
 687 rename_block (bb, idom)
 688      int bb;
 689      int *idom;
 690 {
 691   basic_block b = BASIC_BLOCK (bb);
 692   edge e;
 693   rtx insn, next, last;
 694   struct rename_set_data *set_data = NULL;
 695   int c;
 696
 697   /* Step One: Walk the basic block, adding new names for sets and
 698      replacing uses.  */
 699
 700   next = b->head;
 701   last = b->end;
 702   do
 703     {
 704       insn = next;
 705       if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
 706         {
 707           struct rename_context context;
 708           context.set_data = set_data;
 709           context.current_insn = insn;
 710
 711           for_each_rtx (&PATTERN (insn), rename_insn_1, &context);
 712           for_each_rtx (&REG_NOTES (insn), rename_insn_1, &context);
 713
 714           new_registers_for_updates (context.set_data, set_data, insn);
 715           set_data = context.set_data;
 716         }
 717
 718       next = NEXT_INSN (insn);
 719     }
 720   while (insn != last);
 721
 722   /* Step Two: Update the phi nodes of this block's successors.  */
 723
 724   for (e = b->succ; e; e = e->succ_next)
 725     {
 726       if (e->dest == EXIT_BLOCK_PTR)
 727         continue;
 728
 729       insn = e->dest->head;
 730       if (GET_CODE (insn) == CODE_LABEL)
 731         insn = NEXT_INSN (insn);
 732
 733       while (PHI_NODE_P (insn))
 734         {
 735           rtx phi = PATTERN (insn);
 736           unsigned int regno;
 737           rtx reg;
 738
 739           /* Find out which of our outgoing registers this node is
 740              indended to replace.  Note that if this not the first PHI
 741              node to have been created for this register, we have to
 742              jump through rename links to figure out which register
 743              we're talking about.  This can easily be recognized by
 744              noting that the regno is new to this pass.  */
 745           regno = REGNO (SET_DEST (phi));
 746           if (regno >= ssa_max_reg_num)
 747             regno = REGNO (VARRAY_RTX (ssa_rename_from, regno));
 748           reg = ssa_rename_to[regno - FIRST_PSEUDO_REGISTER];
 749
 750           /* It is possible for the variable to be uninitialized on
 751              edges in.  Reduce the arity of the PHI so that we don't
 752              consider those edges.  */
 753           if (reg == NULL || reg == RENAME_NO_RTX)
 754             {
 755               if (! remove_phi_alternative (phi, bb))
 756                 abort ();
 757             }
 758           else
 759             {
 760               /* When we created the PHI nodes, we did not know what mode
 761              the register should be.  Now that we've found an original,
 762              we can fill that in.  */
 763               if (GET_MODE (SET_DEST (phi)) == VOIDmode)
 764                 PUT_MODE (SET_DEST (phi), GET_MODE (reg));
 765               else if (GET_MODE (SET_DEST (phi)) != GET_MODE (reg))
 766                 abort();
 767
 768               *phi_alternative (phi, bb) = reg;
 769               /* ??? Mark for a new ssa_uses entry.  */
 770             }
 771
 772           insn = NEXT_INSN (insn);
 773         }
 774     }
 775
 776   /* Step Three: Do the same to the children of this block in
 777      dominator order.  */
 778
 779   for (c = 0; c < n_basic_blocks; ++c)
 780     if (idom[c] == bb)
 781       rename_block (c, idom);
 782
 783   /* Step Four: Update the sets to refer to their new register.  */
 784
 785   while (set_data)
 786     {
 787       struct rename_set_data *next;
 788       rtx old_reg = *set_data->reg_loc;
 789
 790       /* If the set is of a subreg only, copy the entire reg first so
 791          that unmodified bits are preserved.  Of course, we don't
 792          strictly have SSA any more, but that's the best we can do
 793          without a lot of hard work.  */
 794
 795       if (GET_CODE (set_data->set_dest) == SUBREG)
 796         {
 797           if (old_reg != set_data->new_reg)
 798             {
 799               rtx copy = gen_rtx_SET (GET_MODE (old_reg),
 800                                       set_data->new_reg, old_reg);
 801               emit_insn_before (copy, set_data->set_insn);
 802             }
 803         }
 804
 805       *set_data->reg_loc = set_data->new_reg;
 806       ssa_rename_to[REGNO (old_reg)-FIRST_PSEUDO_REGISTER]
 807         = set_data->prev_reg;
 808
 809       next = set_data->next;
 810       free (set_data);
 811       set_data = next;
 812     }
 813 }
 814
 815 static void
 816 rename_registers (nregs, idom)
 817      int nregs;
 818      int *idom;
 819 {
 820   VARRAY_RTX_INIT (ssa_definition, nregs * 3, "ssa_definition");
 821   VARRAY_RTX_INIT (ssa_uses, nregs * 3, "ssa_uses");
 822   VARRAY_RTX_INIT (ssa_rename_from, nregs * 3, "ssa_rename_from");
 823
 824   ssa_rename_to = (rtx *) alloca (nregs * sizeof(rtx));
 825   bzero ((char *) ssa_rename_to, nregs * sizeof(rtx));
 826
 827   rename_block (0, idom);
 828
 829   /* ??? Update basic_block_live_at_start, and other flow info
 830      as needed.  */
 831
 832   ssa_rename_to = NULL;
 833 }
 834
 835
 836 /* The main entry point for moving to SSA.  */
 837
 838 void
 839 convert_to_ssa()
 840 {
 841   /* Element I is the set of blocks that set register I.  */
 842   sbitmap *evals;
 843
 844   /* Dominator bitmaps.  */
 845   sbitmap *dominators;
 846   sbitmap *dfs;
 847   sbitmap *idfs;
 848
 849   /* Element I is the immediate dominator of block I.  */
 850   int *idom;
 851
 852   int nregs;
 853
 854   /* Don't do it twice.  */
 855   if (in_ssa_form)
 856     abort ();
 857
 858   /* Need global_live_at_{start,end} up to date.  */
 859   life_analysis (get_insns (), NULL, PROP_KILL_DEAD_CODE | PROP_SCAN_DEAD_CODE);
 860
 861   /* Compute dominators.  */
 862   dominators = sbitmap_vector_alloc (n_basic_blocks, n_basic_blocks);
 863   compute_flow_dominators (dominators, NULL);
 864
 865   idom = (int *) alloca (n_basic_blocks * sizeof (int));
 866   memset ((void *)idom, -1, (size_t)n_basic_blocks * sizeof (int));
 867   simplify_to_immediate_dominators (idom, dominators);
 868
 869   sbitmap_vector_free (dominators);
 870
 871   if (rtl_dump_file)
 872     {
 873       int i;
 874       fputs (";; Immediate Dominators:\n", rtl_dump_file);
 875       for (i = 0; i < n_basic_blocks; ++i)
 876         fprintf (rtl_dump_file, ";\t%3d = %3d\n", i, idom[i]);
 877       fflush (rtl_dump_file);
 878     }
 879
 880   /* Compute dominance frontiers.  */
 881
 882   dfs = sbitmap_vector_alloc (n_basic_blocks, n_basic_blocks);
 883   compute_dominance_frontiers (dfs, idom);
 884
 885   if (rtl_dump_file)
 886     {
 887       dump_sbitmap_vector (rtl_dump_file, ";; Dominance Frontiers:",
 888                            "; Basic Block", dfs, n_basic_blocks);
 889       fflush (rtl_dump_file);
 890     }
 891
 892   /* Compute register evaluations.  */
 893
 894   ssa_max_reg_num = max_reg_num();
 895   nregs = ssa_max_reg_num - FIRST_PSEUDO_REGISTER;
 896   evals = sbitmap_vector_alloc (nregs, n_basic_blocks);
 897   find_evaluations (evals, nregs);
 898
 899   /* Compute the iterated dominance frontier for each register.  */
 900
 901   idfs = sbitmap_vector_alloc (nregs, n_basic_blocks);
 902   compute_iterated_dominance_frontiers (idfs, dfs, evals, nregs);
 903
 904   if (rtl_dump_file)
 905     {
 906       dump_sbitmap_vector (rtl_dump_file, ";; Iterated Dominance Frontiers:",
 907                            "; Register-FIRST_PSEUDO_REGISTER", idfs, nregs);
 908       fflush (rtl_dump_file);
 909     }
 910
 911   /* Insert the phi nodes.  */
 912
 913   insert_phi_nodes (idfs, evals, nregs);
 914
 915   /* Rename the registers to satisfy SSA.  */
 916
 917   rename_registers (nregs, idom);
 918
 919   /* All done!  Clean up and go home.  */
 920
 921   sbitmap_vector_free (dfs);
 922   sbitmap_vector_free (evals);
 923   sbitmap_vector_free (idfs);
 924   in_ssa_form = 1;
 925
 926   reg_scan (get_insns (), max_reg_num (), 1);
 927 }
 928
 929
 930 /* REG is the representative temporary of its partition.  Add it to the
 931    set of nodes to be processed, if it hasn't been already.  Return the
 932    index of this register in the node set.  */
 933
 934 static inline int
 935 ephi_add_node (reg, nodes, n_nodes)
 936      rtx reg, *nodes;
 937      int *n_nodes;
 938 {
 939   int i;
 940   for (i = *n_nodes - 1; i >= 0; --i)
 941     if (REGNO (reg) == REGNO (nodes[i]))
 942       return i;
 943
 944   nodes[i = (*n_nodes)++] = reg;
 945   return i;
 946 }
 947
 948 /* Part one of the topological sort.  This is a forward (downward) search
 949    through the graph collecting a stack of nodes to process.  Assuming no
 950    cycles, the nodes at top of the stack when we are finished will have
 951    no other dependancies.  */
 952
 953 static int *
 954 ephi_forward (t, visited, succ, tstack)
 955      int t;
 956      sbitmap visited;
 957      sbitmap *succ;
 958      int *tstack;
 959 {
 960   int s;
 961
 962   SET_BIT (visited, t);
 963
 964   EXECUTE_IF_SET_IN_SBITMAP (succ[t], 0, s,
 965     {
 966       if (! TEST_BIT (visited, s))
 967         tstack = ephi_forward (s, visited, succ, tstack);
 968     });
 969
 970   *tstack++ = t;
 971   return tstack;
 972 }
 973
 974 /* Part two of the topological sort.  The is a backward search through
 975    a cycle in the graph, copying the data forward as we go.  */
 976
 977 static void
 978 ephi_backward (t, visited, pred, nodes)
 979      int t;
 980      sbitmap visited, *pred;
 981      rtx *nodes;
 982 {
 983   int p;
 984
 985   SET_BIT (visited, t);
 986
 987   EXECUTE_IF_SET_IN_SBITMAP (pred[t], 0, p,
 988     {
 989       if (! TEST_BIT (visited, p))
 990         {
 991           ephi_backward (p, visited, pred, nodes);
 992           emit_move_insn (nodes[p], nodes[t]);
 993         }
 994     });
 995 }
 996
 997 /* Part two of the topological sort.  Create the copy for a register
 998    and any cycle of which it is a member.  */
 999
1000 static void
1001 ephi_create (t, visited, pred, succ, nodes)
1002      int t;
1003      sbitmap visited, *pred, *succ;
1004      rtx *nodes;
1005 {
1006   rtx reg_u = NULL_RTX;
1007   int unvisited_predecessors = 0;
1008   int p;
1009
1010   /* Iterate through the predecessor list looking for unvisited nodes.
1011      If there are any, we have a cycle, and must deal with that.  At
1012      the same time, look for a visited predecessor.  If there is one,
1013      we won't need to create a temporary.  */
1014
1015   EXECUTE_IF_SET_IN_SBITMAP (pred[t], 0, p,
1016     {
1017       if (! TEST_BIT (visited, p))
1018         unvisited_predecessors = 1;
1019       else if (!reg_u)
1020         reg_u = nodes[p];
1021     });
1022
1023   if (unvisited_predecessors)
1024     {
1025       /* We found a cycle.  Copy out one element of the ring (if necessary),
1026          then traverse the ring copying as we go.  */
1027
1028       if (!reg_u)
1029         {
1030           reg_u = gen_reg_rtx (GET_MODE (nodes[t]));
1031           emit_move_insn (reg_u, nodes[t]);
1032         }
1033
1034       EXECUTE_IF_SET_IN_SBITMAP (pred[t], 0, p,
1035         {
1036           if (! TEST_BIT (visited, p))
1037             {
1038               ephi_backward (p, visited, pred, nodes);
1039               emit_move_insn (nodes[p], reg_u);
1040             }
1041         });
1042     }
1043   else
1044     {
1045       /* No cycle.  Just copy the value from a successor.  */
1046
1047       int s;
1048       EXECUTE_IF_SET_IN_SBITMAP (succ[t], 0, s,
1049         {
1050           SET_BIT (visited, t);
1051           emit_move_insn (nodes[t], nodes[s]);
1052           return;
1053         });
1054     }
1055 }
1056
1057 /* Convert the edge to normal form.  */
1058
1059 static void
1060 eliminate_phi (e, reg_partition)
1061      edge e;
1062      partition reg_partition;
1063 {
1064   int n_nodes;
1065   sbitmap *pred, *succ;
1066   sbitmap visited;
1067   rtx *nodes;
1068   int *stack, *tstack;
1069   rtx insn;
1070   int i;
1071
1072   /* Collect an upper bound on the number of registers needing processing.  */
1073
1074   insn = e->dest->head;
1075   if (GET_CODE (insn) == CODE_LABEL)
1076     insn = next_nonnote_insn (insn);
1077
1078   n_nodes = 0;
1079   while (PHI_NODE_P (insn))
1080     {
1081       insn = next_nonnote_insn (insn);
1082       n_nodes += 2;
1083     }
1084
1085   if (n_nodes == 0)
1086     return;
1087
1088   /* Build the auxilliary graph R(B).
1089
1090      The nodes of the graph are the members of the register partition
1091      present in Phi(B).  There is an edge from FIND(T0)->FIND(T1) for
1092      each T0 = PHI(...,T1,...), where T1 is for the edge from block C.  */
1093
1094   nodes = (rtx *) alloca (n_nodes * sizeof(rtx));
1095   pred = sbitmap_vector_alloc (n_nodes, n_nodes);
1096   succ = sbitmap_vector_alloc (n_nodes, n_nodes);
1097   sbitmap_vector_zero (pred, n_nodes);
1098   sbitmap_vector_zero (succ, n_nodes);
1099
1100   insn = e->dest->head;
1101   if (GET_CODE (insn) == CODE_LABEL)
1102     insn = next_nonnote_insn (insn);
1103
1104   n_nodes = 0;
1105   for (; PHI_NODE_P (insn); insn = next_nonnote_insn (insn))
1106     {
1107       rtx* preg = phi_alternative (PATTERN (insn), e->src->index);
1108       rtx tgt = SET_DEST (PATTERN (insn));
1109       rtx reg;
1110
1111       /* There may be no phi alternative corresponding to this edge.
1112          This indicates that the phi variable is undefined along this
1113          edge.  */
1114       if (preg == NULL)
1115         continue;
1116       reg = *preg;
1117
1118       if (GET_CODE (reg) != REG || GET_CODE (tgt) != REG)
1119         abort();
1120
1121       reg = regno_reg_rtx[partition_find (reg_partition, REGNO (reg))];
1122       tgt = regno_reg_rtx[partition_find (reg_partition, REGNO (tgt))];
1123       /* If the two registers are already in the same partition,
1124          nothing will need to be done.  */
1125       if (reg != tgt)
1126         {
1127           int ireg, itgt;
1128
1129           ireg = ephi_add_node (reg, nodes, &n_nodes);
1130           itgt = ephi_add_node (tgt, nodes, &n_nodes);
1131
1132           SET_BIT (pred[ireg], itgt);
1133           SET_BIT (succ[itgt], ireg);
1134         }
1135     }
1136
1137   if (n_nodes == 0)
1138     goto out;
1139
1140   /* Begin a topological sort of the graph.  */
1141
1142   visited = sbitmap_alloc (n_nodes);
1143   sbitmap_zero (visited);
1144
1145   tstack = stack = (int *) alloca (n_nodes * sizeof (int));
1146
1147   for (i = 0; i < n_nodes; ++i)
1148     if (! TEST_BIT (visited, i))
1149       tstack = ephi_forward (i, visited, succ, tstack);
1150
1151   sbitmap_zero (visited);
1152
1153   /* As we find a solution to the tsort, collect the implementation
1154      insns in a sequence.  */
1155   start_sequence ();
1156
1157   while (tstack != stack)
1158     {
1159       i = *--tstack;
1160       if (! TEST_BIT (visited, i))
1161         ephi_create (i, visited, pred, succ, nodes);
1162     }
1163
1164   insn = gen_sequence ();
1165   end_sequence ();
1166   insert_insn_on_edge (insn, e);
1167   if (rtl_dump_file)
1168     fprintf (rtl_dump_file, "Emitting copy on edge (%d,%d)\n",
1169              e->src->index, e->dest->index);
1170
1171   sbitmap_free (visited);
1172 out:
1173   sbitmap_vector_free (pred);
1174   sbitmap_vector_free (succ);
1175 }
1176
1177
1178 /* For basic block B, consider all phi insns which provide an
1179    alternative corresponding to an incoming abnormal critical edge.
1180    Place the phi alternative corresponding to that abnormal critical
1181    edge in the same register class as the destination of the set.
1182
1183    From Morgan, p. 178:
1184
1185      For each abnormal critical edge (C, B),
1186      if T0 = phi (T1, ..., Ti, ..., Tm) is a phi node in B,
1187      and C is the ith predecessor of B,
1188      then T0 and Ti must be equivalent.
1189
1190    Return non-zero iff any such cases were found for which the two
1191    regs were not already in the same class.  */
1192
1193 static int
1194 make_regs_equivalent_over_bad_edges (bb, reg_partition)
1195      int bb;
1196      partition reg_partition;
1197 {
1198   int changed = 0;
1199   basic_block b = BASIC_BLOCK (bb);
1200   rtx phi = b->head;
1201
1202   /* Advance to the first phi node.  */
1203   if (GET_CODE (phi) == CODE_LABEL)
1204     phi = next_nonnote_insn (phi);
1205
1206   /* Scan all the phi nodes.  */
1207   for (;
1208        PHI_NODE_P (phi);
1209        phi = next_nonnote_insn (phi))
1210     {
1211       edge e;
1212       int tgt_regno;
1213       rtx set = PATTERN (phi);
1214       rtx tgt = SET_DEST (set);
1215
1216       /* The set target is expected to be a pseudo.  */
1217       if (GET_CODE (tgt) != REG
1218           || REGNO (tgt) < FIRST_PSEUDO_REGISTER)
1219         abort ();
1220       tgt_regno = REGNO (tgt);
1221
1222       /* Scan incoming abnormal critical edges.  */
1223       for (e = b->pred; e; e = e->pred_next)
1224         if (e->flags & (EDGE_ABNORMAL | EDGE_CRITICAL))
1225           {
1226             rtx *alt = phi_alternative (set, e->src->index);
1227             int alt_regno;
1228
1229             /* If there is no alternative corresponding to this edge,
1230                the value is undefined along the edge, so just go on.  */
1231             if (alt == 0)
1232               continue;
1233
1234             /* The phi alternative is expected to be a pseudo.  */
1235             if (GET_CODE (*alt) != REG
1236                 || REGNO (*alt) < FIRST_PSEUDO_REGISTER)
1237               abort ();
1238             alt_regno = REGNO (*alt);
1239
1240             /* If the set destination and the phi alternative aren't
1241                already in the same class...  */
1242             if (partition_find (reg_partition, tgt_regno)
1243                 != partition_find (reg_partition, alt_regno))
1244               {
1245                 /* ... make them such.  */
1246                 partition_union (reg_partition,
1247                                  tgt_regno, alt_regno);
1248                 ++changed;
1249               }
1250           }
1251     }
1252
1253   return changed;
1254 }
1255
1256
1257 /* Consider phi insns in basic block BB pairwise.  If the set target
1258    of both isns are equivalent pseudos, make the corresponding phi
1259    alternatives in each phi corresponding equivalent.
1260
1261    Return nonzero if any new register classes were unioned.  */
1262
1263 static int
1264 make_equivalent_phi_alternatives_equivalent (bb, reg_partition)
1265      int bb;
1266      partition reg_partition;
1267 {
1268   int changed = 0;
1269   rtx phi = BLOCK_HEAD (bb);
1270   basic_block b = BASIC_BLOCK (bb);
1271
1272   /* Advance to the first phi node.  */
1273   if (GET_CODE (phi) == CODE_LABEL)
1274     phi = next_nonnote_insn (phi);
1275
1276   /* Scan all the phi nodes.  */
1277   for (;
1278        PHI_NODE_P (phi);
1279        phi = next_nonnote_insn (phi))
1280     {
1281       rtx set = PATTERN (phi);
1282       /* The regno of the destination of the set.  */
1283       int tgt_regno = REGNO (SET_DEST (PATTERN (phi)));
1284
1285       rtx phi2 = next_nonnote_insn (phi);
1286
1287       /* Scan all phi nodes following this one.  */
1288       for (;
1289            PHI_NODE_P (phi2);
1290            phi2 = next_nonnote_insn (phi2))
1291         {
1292           rtx set2 = PATTERN (phi2);
1293           /* The regno of the destination of the set.  */
1294           int tgt2_regno = REGNO (SET_DEST (set2));
1295
1296           /* Are the set destinations equivalent regs?  */
1297           if (partition_find (reg_partition, tgt_regno) ==
1298               partition_find (reg_partition, tgt2_regno))
1299             {
1300               edge e;
1301               /* Scan over edges.  */
1302               for (e = b->pred; e; e = e->pred_next)
1303                 {
1304                   int pred_block = e->src->index;
1305                   /* Identify the phi altnernatives from both phi
1306                      nodes corresponding to this edge.  */
1307                   rtx *alt = phi_alternative (set, pred_block);
1308                   rtx *alt2 = phi_alternative (set2, pred_block);
1309
1310                   /* If one of the phi nodes doesn't have a
1311                      corresponding alternative, just skip it.  */
1312                   if (alt == 0 || alt2 == 0)
1313                     continue;
1314
1315                   /* Both alternatives should be pseudos.  */
1316                   if (GET_CODE (*alt) != REG
1317                       || REGNO (*alt) < FIRST_PSEUDO_REGISTER)
1318                     abort ();
1319                   if (GET_CODE (*alt2) != REG
1320                       || REGNO (*alt2) < FIRST_PSEUDO_REGISTER)
1321                     abort ();
1322
1323                   /* If the altneratives aren't already in the same
1324                      class ... */
1325                   if (partition_find (reg_partition, REGNO (*alt))
1326                       != partition_find (reg_partition, REGNO (*alt2)))
1327                     {
1328                       /* ... make them so.  */
1329                       partition_union (reg_partition,
1330                                        REGNO (*alt), REGNO (*alt2));
1331                       ++changed;
1332                     }
1333                 }
1334             }
1335         }
1336     }
1337
1338   return changed;
1339 }
1340
1341 /* Compute a conservative partition of outstanding pseudo registers.
1342    See Morgan 7.3.1.  */
1343
1344 static partition
1345 compute_conservative_reg_partition ()
1346 {
1347   int bb;
1348   int changed = 0;
1349
1350   /* We don't actually work with hard registers, but it's easier to
1351      carry them around anyway rather than constantly doing register
1352      number arithmetic.  */
1353   partition p =
1354     partition_new (ssa_definition->num_elements + FIRST_PSEUDO_REGISTER);
1355
1356   /* The first priority is to make sure registers that might have to
1357      be copied on abnormal critical edges are placed in the same
1358      partition.  This saves us from having to split abnormal critical
1359      edges.  */
1360   for (bb = n_basic_blocks; --bb >= 0; )
1361     changed += make_regs_equivalent_over_bad_edges (bb, p);
1362
1363   /* Now we have to insure that corresponding arguments of phi nodes
1364      assigning to corresponding regs are equivalent.  Iterate until
1365      nothing changes.  */
1366   while (changed > 0)
1367     {
1368       changed = 0;
1369       for (bb = n_basic_blocks; --bb >= 0; )
1370         changed += make_equivalent_phi_alternatives_equivalent (bb, p);
1371     }
1372
1373   return p;
1374 }
1375
1376 /* The following functions compute a register partition that attempts
1377    to eliminate as many reg copies and phi node copies as possible by
1378    coalescing registers.   This is the strategy:
1379
1380     1. As in the conservative case, the top priority is to coalesce
1381        registers that otherwise would cause copies to be placed on
1382        abnormal critical edges (which isn't possible).
1383
1384     2. Figure out which regs are involved (in the LHS or RHS) of
1385        copies and phi nodes.  Compute conflicts among these regs.
1386
1387     3. Walk around the instruction stream, placing two regs in the
1388        same class of the partition if one appears on the LHS and the
1389        other on the RHS of a copy or phi node and the two regs don't
1390        conflict.  The conflict information of course needs to be
1391        updated.
1392
1393     4. If anything has changed, there may be new opportunities to
1394        coalesce regs, so go back to 2.
1395 */
1396
1397 /* If REG1 and REG2 don't conflict in CONFLICTS, place them in the
1398    same class of partition P, if they aren't already.  Update
1399    CONFLICTS appropriately.
1400
1401    Returns one if REG1 and REG2 were placed in the same class but were
1402    not previously; zero otherwise.
1403
1404    See Morgan figure 11.15.  */
1405
1406 static int
1407 coalesce_if_unconflicting (p, conflicts, reg1, reg2)
1408      partition p;
1409      conflict_graph conflicts;
1410      int reg1;
1411      int reg2;
1412 {
1413   int reg;
1414
1415   /* Don't mess with hard regs.  */
1416   if (reg1 < FIRST_PSEUDO_REGISTER || reg2 < FIRST_PSEUDO_REGISTER)
1417     return 0;
1418
1419   /* Find the canonical regs for the classes containing REG1 and
1420      REG2.  */
1421   reg1 = partition_find (p, reg1);
1422   reg2 = partition_find (p, reg2);
1423
1424   /* If they're already in the same class, there's nothing to do.  */
1425   if (reg1 == reg2)
1426     return 0;
1427
1428   /* If the regs conflict, our hands are tied.  */
1429   if (conflict_graph_conflict_p (conflicts, reg1, reg2))
1430     return 0;
1431
1432   /* We're good to go.  Put the regs in the same partition.  */
1433   partition_union (p, reg1, reg2);
1434
1435   /* Find the new canonical reg for the merged class.  */
1436   reg = partition_find (p, reg1);
1437
1438   /* Merge conflicts from the two previous classes.  */
1439   conflict_graph_merge_regs (conflicts, reg, reg1);
1440   conflict_graph_merge_regs (conflicts, reg, reg2);
1441
1442   return 1;
1443 }
1444
1445 /* For each register copy insn in basic block BB, place the LHS and
1446    RHS regs in the same class in partition P if they do not conflict
1447    according to CONFLICTS.
1448
1449    Returns the number of changes that were made to P.
1450
1451    See Morgan figure 11.14.  */
1452
1453 static int
1454 coalesce_regs_in_copies (bb, p, conflicts)
1455      basic_block bb;
1456      partition p;
1457      conflict_graph conflicts;
1458 {
1459   int changed = 0;
1460   rtx insn;
1461   rtx end = bb->end;
1462
1463   /* Scan the instruction stream of the block.  */
1464   for (insn = bb->head; insn != end; insn = NEXT_INSN (insn))
1465     {
1466       rtx pattern;
1467       rtx src;
1468       rtx dest;
1469
1470       /* If this isn't a set insn, go to the next insn.  */
1471       if (GET_CODE (insn) != INSN)
1472         continue;
1473       pattern = PATTERN (insn);
1474       if (GET_CODE (pattern) != SET)
1475         continue;
1476
1477       src = SET_SRC (pattern);
1478       dest = SET_DEST (pattern);
1479
1480       /* If src or dest are subregs, find the underlying reg.  */
1481       while (GET_CODE (src) == SUBREG
1482              && SUBREG_WORD (src) != 0)
1483         src = SUBREG_REG (src);
1484       while (GET_CODE (dest) == SUBREG
1485              && SUBREG_WORD (dest) != 0)
1486         dest = SUBREG_REG (dest);
1487
1488       /* We're only looking for copies.  */
1489       if (GET_CODE (src) != REG || GET_CODE (dest) != REG)
1490         continue;
1491
1492       /* Coalesce only if the reg modes are the same.  As long as
1493          each reg's rtx is unique, it can have only one mode, so two
1494          pseudos of different modes can't be coalesced into one.
1495
1496          FIXME: We can probably get around this by inserting SUBREGs
1497          where appropriate, but for now we don't bother.  */
1498       if (GET_MODE (src) != GET_MODE (dest))
1499         continue;
1500
1501       /* Found a copy; see if we can use the same reg for both the
1502          source and destination (and thus eliminate the copy,
1503          ultimately).  */
1504       changed += coalesce_if_unconflicting (p, conflicts,
1505                                             REGNO (src), REGNO (dest));
1506     }
1507
1508   return changed;
1509 }
1510
1511
1512 struct phi_coalesce_context
1513 {
1514   partition p;
1515   conflict_graph conflicts;
1516   int changed;
1517 };
1518
1519 /* Callback function for for_each_successor_phi.  If the set
1520    destination and the phi alternative regs do not conflict, place
1521    them in the same paritition class.  DATA is a pointer to a
1522    phi_coalesce_context struct.  */
1523
1524 static int
1525 coalesce_reg_in_phi (insn, dest_regno, src_regno, data)
1526      rtx insn ATTRIBUTE_UNUSED;
1527      int dest_regno;
1528      int src_regno;
1529      void *data;
1530 {
1531   struct phi_coalesce_context *context =
1532     (struct phi_coalesce_context *) data;
1533
1534   /* Attempt to use the same reg, if they don't conflict.  */
1535   context->changed
1536     += coalesce_if_unconflicting (context->p, context->conflicts,
1537                                   dest_regno, src_regno);
1538   return 0;
1539 }
1540
1541 /* For each alternative in a phi function corresponding to basic block
1542    BB (in phi nodes in successor block to BB), place the reg in the
1543    phi alternative and the reg to which the phi value is set into the
1544    same class in partition P, if allowed by CONFLICTS.
1545
1546    Return the number of changes that were made to P.
1547
1548    See Morgan figure 11.14.  */
1549
1550 static int
1551 coalesce_regs_in_successor_phi_nodes (bb, p, conflicts)
1552      basic_block bb;
1553      partition p;
1554      conflict_graph conflicts;
1555 {
1556   struct phi_coalesce_context context;
1557   context.p = p;
1558   context.conflicts = conflicts;
1559   context.changed = 0;
1560
1561   for_each_successor_phi (bb, &coalesce_reg_in_phi, &context);
1562
1563   return context.changed;
1564 }
1565
1566 /* Compute and return a partition of pseudos.  Where possible,
1567    non-conflicting pseudos are placed in the same class.
1568
1569    The caller is responsible for deallocating the returned partition.  */
1570
1571 static partition
1572 compute_coalesced_reg_partition ()
1573 {
1574   int bb;
1575   int changed = 0;
1576
1577   /* We don't actually work with hard registers, but it's easier to
1578      carry them around anyway rather than constantly doing register
1579      number arithmetic.  */
1580   partition p =
1581     partition_new (ssa_definition->num_elements + FIRST_PSEUDO_REGISTER);
1582
1583   /* The first priority is to make sure registers that might have to
1584      be copied on abnormal critical edges are placed in the same
1585      partition.  This saves us from having to split abnormal critical
1586      edges (which can't be done).  */
1587   for (bb = n_basic_blocks; --bb >= 0; )
1588     make_regs_equivalent_over_bad_edges (bb, p);
1589
1590   do
1591     {
1592       regset_head phi_set;
1593       conflict_graph conflicts;
1594
1595       changed = 0;
1596
1597       /* Build the set of registers involved in phi nodes, either as
1598          arguments to the phi function or as the target of a set.  */
1599       INITIALIZE_REG_SET (phi_set);
1600       mark_phi_and_copy_regs (&phi_set);
1601
1602       /* Compute conflicts.  */
1603       conflicts = conflict_graph_compute (&phi_set, p);
1604
1605       /* FIXME: Better would be to process most frequently executed
1606          blocks first, so that most frequently executed copies would
1607          be more likely to be removed by register coalescing.  But any
1608          order will generate correct, if non-optimal, results.  */
1609       for (bb = n_basic_blocks; --bb >= 0; )
1610         {
1611           basic_block block = BASIC_BLOCK (bb);
1612           changed += coalesce_regs_in_copies (block, p, conflicts);
1613           changed +=
1614             coalesce_regs_in_successor_phi_nodes (block, p, conflicts);
1615         }
1616
1617       conflict_graph_delete (conflicts);
1618     }
1619   while (changed > 0);
1620
1621   return p;
1622 }
1623
1624 /* Mark the regs in a phi node.  PTR is a phi expression or one of its
1625    components (a REG or a CONST_INT).  DATA is a reg set in which to
1626    set all regs.  Called from for_each_rtx.  */
1627
1628 static int
1629 mark_reg_in_phi (ptr, data)
1630      rtx *ptr;
1631      void *data;
1632 {
1633   rtx expr = *ptr;
1634   regset set = (regset) data;
1635
1636   switch (GET_CODE (expr))
1637     {
1638     case REG:
1639       SET_REGNO_REG_SET (set, REGNO (expr));
1640       /* Fall through.  */
1641     case CONST_INT:
1642     case PHI:
1643       return 0;
1644     default:
1645       abort ();
1646     }
1647 }
1648
1649 /* Mark in PHI_SET all pseudos that are used in a phi node -- either
1650    set from a phi expression, or used as an argument in one.  Also
1651    mark regs that are the source or target of a reg copy.  Uses
1652    ssa_definition.  */
1653
1654 static void
1655 mark_phi_and_copy_regs (phi_set)
1656      regset phi_set;
1657 {
1658   int reg;
1659
1660   /* Scan the definitions of all regs.  */
1661   for (reg = VARRAY_SIZE (ssa_definition);
1662        --reg >= FIRST_PSEUDO_REGISTER;
1663        )
1664     {
1665       rtx insn = VARRAY_RTX (ssa_definition, reg);
1666       rtx pattern;
1667       rtx src;
1668
1669       if (insn == NULL)
1670         continue;
1671       pattern = PATTERN (insn);
1672       /* Sometimes we get PARALLEL insns.  These aren't phi nodes or
1673          copies.  */
1674       if (GET_CODE (pattern) != SET)
1675         continue;
1676       src = SET_SRC (pattern);
1677
1678       if (GET_CODE (src) == REG)
1679         {
1680           /* It's a reg copy.  */
1681           SET_REGNO_REG_SET (phi_set, reg);
1682           SET_REGNO_REG_SET (phi_set, REGNO (src));
1683         }
1684       else if (GET_CODE (src) == PHI)
1685         {
1686           /* It's a phi node.  Mark the reg being set.  */
1687           SET_REGNO_REG_SET (phi_set, reg);
1688           /* Mark the regs used in the phi function.  */
1689           for_each_rtx (&src, mark_reg_in_phi, phi_set);
1690         }
1691       /* ... else nothing to do.  */
1692     }
1693 }
1694
1695 /* Rename regs in insn PTR that are equivalent.  DATA is the register
1696    partition which specifies equivalences.  */
1697
1698 static int
1699 rename_equivalent_regs_in_insn (ptr, data)
1700      rtx *ptr;
1701      void* data;
1702 {
1703   rtx x = *ptr;
1704   partition reg_partition = (partition) data;
1705
1706   if (x == NULL_RTX)
1707     return 0;
1708
1709   switch (GET_CODE (x))
1710     {
1711     case SET:
1712       {
1713         rtx *destp = &SET_DEST (x);
1714         rtx dest = SET_DEST (x);
1715
1716         /* Subregs at word 0 are interesting.  Subregs at word != 0 are
1717            presumed to be part of a contiguous multi-word set sequence.  */
1718         while (GET_CODE (dest) == SUBREG
1719                && SUBREG_WORD (dest) == 0)
1720           {
1721             destp = &SUBREG_REG (dest);
1722             dest = SUBREG_REG (dest);
1723           }
1724
1725         if (GET_CODE (dest) == REG
1726             && REGNO (dest) >= FIRST_PSEUDO_REGISTER)
1727           {
1728             /* Got a pseudo; replace it.  */
1729             int regno = REGNO (dest);
1730             int new_regno = partition_find (reg_partition, regno);
1731             if (regno != new_regno)
1732               *destp = regno_reg_rtx[new_regno];
1733
1734             for_each_rtx (&SET_SRC (x),
1735                           rename_equivalent_regs_in_insn,
1736                           data);
1737             return -1;
1738           }
1739
1740         /* Otherwise, this was not an interesting destination.  Continue
1741            on, marking uses as normal.  */
1742         return 0;
1743       }
1744
1745     case REG:
1746       if (REGNO (x) >= FIRST_PSEUDO_REGISTER)
1747         {
1748           int regno = REGNO (x);
1749           int new_regno = partition_find (reg_partition, regno);
1750           if (regno != new_regno)
1751             {
1752               rtx new_reg = regno_reg_rtx[new_regno];
1753               if (GET_MODE (x) != GET_MODE (new_reg))
1754                 abort ();
1755               *ptr = new_reg;
1756             }
1757         }
1758       return -1;
1759
1760     case PHI:
1761       /* No need to rename the phi nodes.  We'll check equivalence
1762          when inserting copies.  */
1763       return -1;
1764
1765     default:
1766       /* Anything else, continue traversing.  */
1767       return 0;
1768     }
1769 }
1770
1771 /* Rename regs that are equivalent in REG_PARTITION.  */
1772
1773 static void
1774 rename_equivalent_regs (reg_partition)
1775      partition reg_partition;
1776 {
1777   int bb;
1778
1779   for (bb = n_basic_blocks; --bb >= 0; )
1780     {
1781       basic_block b = BASIC_BLOCK (bb);
1782       rtx next = b->head;
1783       rtx last = b->end;
1784       rtx insn;
1785
1786       do
1787         {
1788           insn = next;
1789           if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
1790             {
1791               for_each_rtx (&PATTERN (insn),
1792                             rename_equivalent_regs_in_insn,
1793                             reg_partition);
1794               for_each_rtx (&REG_NOTES (insn),
1795                             rename_equivalent_regs_in_insn,
1796                             reg_partition);
1797             }
1798
1799           next = NEXT_INSN (insn);
1800         }
1801       while (insn != last);
1802     }
1803 }
1804
1805 /* The main entry point for moving from SSA.  */
1806
1807 void
1808 convert_from_ssa()
1809 {
1810   int bb;
1811   partition reg_partition;
1812   rtx insns = get_insns ();
1813
1814   /* Need global_live_at_{start,end} up to date.  */
1815   life_analysis (insns, NULL, PROP_KILL_DEAD_CODE | PROP_SCAN_DEAD_CODE);
1816
1817   /* Figure out which regs in copies and phi nodes don't conflict and
1818      therefore can be coalesced.  */
1819   if (conservative_reg_partition)
1820     reg_partition = compute_conservative_reg_partition ();
1821   else
1822     reg_partition = compute_coalesced_reg_partition ();
1823
1824   rename_equivalent_regs (reg_partition);
1825
1826   /* Eliminate the PHI nodes.  */
1827   for (bb = n_basic_blocks; --bb >= 0; )
1828     {
1829       basic_block b = BASIC_BLOCK (bb);
1830       edge e;
1831
1832       for (e = b->pred; e; e = e->pred_next)
1833         if (e->src != ENTRY_BLOCK_PTR)
1834           eliminate_phi (e, reg_partition);
1835     }
1836
1837   partition_delete (reg_partition);
1838
1839   /* Actually delete the PHI nodes.  */
1840   for (bb = n_basic_blocks; --bb >= 0; )
1841     {
1842       rtx insn = BLOCK_HEAD (bb);
1843       int start = (GET_CODE (insn) != CODE_LABEL);
1844
1845       if (! start)
1846         insn = next_nonnote_insn (insn);
1847       while (PHI_NODE_P (insn))
1848         {
1849           /* If a phi node is the last insn in the block, there must
1850              have been nothing else.  Set the block end to the block
1851              head.  */
1852           if (insn == BLOCK_END (bb))
1853             BLOCK_END (bb) = BLOCK_HEAD (bb);
1854           insn = delete_insn (insn);
1855           if (GET_CODE (insn) == NOTE)
1856             insn = next_nonnote_insn (insn);
1857         }
1858       if (start)
1859         BLOCK_HEAD (bb) = insn;
1860     }
1861
1862   /* Commit all the copy nodes needed to convert out of SSA form.  */
1863   commit_edge_insertions ();
1864
1865   in_ssa_form = 0;
1866
1867   count_or_remove_death_notes (NULL, 1);
1868 }
1869
1870 /* Scan phi nodes in successors to BB.  For each such phi node that
1871    has a phi alternative value corresponding to BB, invoke FN.  FN
1872    is passed the entire phi node insn, the regno of the set
1873    destination, the regno of the phi argument corresponding to BB,
1874    and DATA.
1875
1876    If FN ever returns non-zero, stops immediately and returns this
1877    value.  Otherwise, returns zero.  */
1878
1879 int
1880 for_each_successor_phi (bb, fn, data)
1881      basic_block bb;
1882      successor_phi_fn fn;
1883      void *data;
1884 {
1885   edge e;
1886
1887   if (bb == EXIT_BLOCK_PTR)
1888     return 0;
1889
1890   /* Scan outgoing edges.  */
1891   for (e = bb->succ; e != NULL; e = e->succ_next)
1892     {
1893       rtx insn;
1894
1895       basic_block successor = e->dest;
1896       if (successor == ENTRY_BLOCK_PTR
1897           || successor == EXIT_BLOCK_PTR)
1898         continue;
1899
1900       /* Advance to the first non-label insn of the successor block.  */
1901       insn = successor->head;
1902       while (insn != NULL
1903              && (GET_CODE (insn) == CODE_LABEL
1904                  || GET_CODE (insn) == NOTE))
1905         insn = NEXT_INSN (insn);
1906
1907       if (insn == NULL)
1908         continue;
1909
1910       /* Scan phi nodes in the successor.  */
1911       for ( ; PHI_NODE_P (insn); insn = NEXT_INSN (insn))
1912         {
1913           int result;
1914           rtx phi_set = PATTERN (insn);
1915           rtx *alternative = phi_alternative (phi_set, bb->index);
1916           rtx phi_src;
1917
1918           /* This phi function may not have an alternative
1919              corresponding to the incoming edge, indicating the
1920              assigned variable is not defined along the edge.  */
1921           if (alternative == NULL)
1922             continue;
1923           phi_src = *alternative;
1924
1925           /* Invoke the callback.  */
1926           result = (*fn) (insn, REGNO (SET_DEST (phi_set)),
1927                           REGNO (phi_src), data);
1928
1929           /* Terminate if requested.  */
1930           if (result != 0)
1931             return result;
1932         }
1933     }
1934
1935   return 0;
1936 }