gcc/reorg.c

   1 /* Perform instruction reorganizations for delay slot filling.
   2    Copyright (C) 1992, 1993, 1994, 1995 Free Software Foundation, Inc.
   3    Contributed by Richard Kenner (kenner@vlsi1.ultra.nyu.edu).
   4    Hacked by Michael Tiemann (tiemann@cygnus.com).
   5
   6 This file is part of GNU CC.
   7
   8 GNU CC is free software; you can redistribute it and/or modify
   9 it under the terms of the GNU General Public License as published by
  10 the Free Software Foundation; either version 2, or (at your option)
  11 any later version.
  12
  13 GNU CC is distributed in the hope that it will be useful,
  14 but WITHOUT ANY WARRANTY; without even the implied warranty of
  15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  16 GNU General Public License for more details.
  17
  18 You should have received a copy of the GNU General Public License
  19 along with GNU CC; see the file COPYING.  If not, write to
  20 the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.  */
  21
  22 /* Instruction reorganization pass.
  23
  24    This pass runs after register allocation and final jump
  25    optimization.  It should be the last pass to run before peephole.
  26    It serves primarily to fill delay slots of insns, typically branch
  27    and call insns.  Other insns typically involve more complicated
  28    interactions of data dependencies and resource constraints, and
  29    are better handled by scheduling before register allocation (by the
  30    function `schedule_insns').
  31
  32    The Branch Penalty is the number of extra cycles that are needed to
  33    execute a branch insn.  On an ideal machine, branches take a single
  34    cycle, and the Branch Penalty is 0.  Several RISC machines approach
  35    branch delays differently:
  36
  37    The MIPS and AMD 29000 have a single branch delay slot.  Most insns
  38    (except other branches) can be used to fill this slot.  When the
  39    slot is filled, two insns execute in two cycles, reducing the
  40    branch penalty to zero.
  41
  42    The Motorola 88000 conditionally exposes its branch delay slot,
  43    so code is shorter when it is turned off, but will run faster
  44    when useful insns are scheduled there.
  45
  46    The IBM ROMP has two forms of branch and call insns, both with and
  47    without a delay slot.  Much like the 88k, insns not using the delay
  48    slot can be shorted (2 bytes vs. 4 bytes), but will run slowed.
  49
  50    The SPARC always has a branch delay slot, but its effects can be
  51    annulled when the branch is not taken.  This means that failing to
  52    find other sources of insns, we can hoist an insn from the branch
  53    target that would only be safe to execute knowing that the branch
  54    is taken.
  55
  56    The HP-PA always has a branch delay slot.  For unconditional branches
  57    its effects can be annulled when the branch is taken.  The effects
  58    of the delay slot in a conditional branch can be nullified for forward
  59    taken branches, or for untaken backward branches.  This means
  60    we can hoist insns from the fall-through path for forward branches or
  61    steal insns from the target of backward branches.
  62
  63    Three techniques for filling delay slots have been implemented so far:
  64
  65    (1) `fill_simple_delay_slots' is the simplest, most efficient way
  66    to fill delay slots.  This pass first looks for insns which come
  67    from before the branch and which are safe to execute after the
  68    branch.  Then it searches after the insn requiring delay slots or,
  69    in the case of a branch, for insns that are after the point at
  70    which the branch merges into the fallthrough code, if such a point
  71    exists.  When such insns are found, the branch penalty decreases
  72    and no code expansion takes place.
  73
  74    (2) `fill_eager_delay_slots' is more complicated: it is used for
  75    scheduling conditional jumps, or for scheduling jumps which cannot
  76    be filled using (1).  A machine need not have annulled jumps to use
  77    this strategy, but it helps (by keeping more options open).
  78    `fill_eager_delay_slots' tries to guess the direction the branch
  79    will go; if it guesses right 100% of the time, it can reduce the
  80    branch penalty as much as `fill_simple_delay_slots' does.  If it
  81    guesses wrong 100% of the time, it might as well schedule nops (or
  82    on the m88k, unexpose the branch slot).  When
  83    `fill_eager_delay_slots' takes insns from the fall-through path of
  84    the jump, usually there is no code expansion; when it takes insns
  85    from the branch target, there is code expansion if it is not the
  86    only way to reach that target.
  87
  88    (3) `relax_delay_slots' uses a set of rules to simplify code that
  89    has been reorganized by (1) and (2).  It finds cases where
  90    conditional test can be eliminated, jumps can be threaded, extra
  91    insns can be eliminated, etc.  It is the job of (1) and (2) to do a
  92    good job of scheduling locally; `relax_delay_slots' takes care of
  93    making the various individual schedules work well together.  It is
  94    especially tuned to handle the control flow interactions of branch
  95    insns.  It does nothing for insns with delay slots that do not
  96    branch.
  97
  98    On machines that use CC0, we are very conservative.  We will not make
  99    a copy of an insn involving CC0 since we want to maintain a 1-1
 100    correspondence between the insn that sets and uses CC0.  The insns are
 101    allowed to be separated by placing an insn that sets CC0 (but not an insn
 102    that uses CC0; we could do this, but it doesn't seem worthwhile) in a
 103    delay slot.  In that case, we point each insn at the other with REG_CC_USER
 104    and REG_CC_SETTER notes.  Note that these restrictions affect very few
 105    machines because most RISC machines with delay slots will not use CC0
 106    (the RT is the only known exception at this point).
 107
 108    Not yet implemented:
 109
 110    The Acorn Risc Machine can conditionally execute most insns, so
 111    it is profitable to move single insns into a position to execute
 112    based on the condition code of the previous insn.
 113
 114    The HP-PA can conditionally nullify insns, providing a similar
 115    effect to the ARM, differing mostly in which insn is "in charge".   */
 116
 117 #include <stdio.h>
 118 #include "config.h"
 119 #include "rtl.h"
 120 #include "insn-config.h"
 121 #include "conditions.h"
 122 #include "hard-reg-set.h"
 123 #include "basic-block.h"
 124 #include "regs.h"
 125 #include "insn-flags.h"
 126 #include "recog.h"
 127 #include "flags.h"
 128 #include "output.h"
 129 #include "obstack.h"
 130 #include "insn-attr.h"
 131
 132 #ifdef DELAY_SLOTS
 133
 134 #define obstack_chunk_alloc xmalloc
 135 #define obstack_chunk_free free
 136
 137 #ifndef ANNUL_IFTRUE_SLOTS
 138 #define eligible_for_annul_true(INSN, SLOTS, TRIAL, FLAGS) 0
 139 #endif
 140 #ifndef ANNUL_IFFALSE_SLOTS
 141 #define eligible_for_annul_false(INSN, SLOTS, TRIAL, FLAGS) 0
 142 #endif
 143
 144 /* Insns which have delay slots that have not yet been filled.  */
 145
 146 static struct obstack unfilled_slots_obstack;
 147 static rtx *unfilled_firstobj;
 148
 149 /* Define macros to refer to the first and last slot containing unfilled
 150    insns.  These are used because the list may move and its address
 151    should be recomputed at each use.  */
 152
 153 #define unfilled_slots_base     \
 154   ((rtx *) obstack_base (&unfilled_slots_obstack))
 155
 156 #define unfilled_slots_next     \
 157   ((rtx *) obstack_next_free (&unfilled_slots_obstack))
 158
 159 /* This structure is used to indicate which hardware resources are set or
 160    needed by insns so far.  */
 161
 162 struct resources
 163 {
 164   char memory;                  /* Insn sets or needs a memory location.  */
 165   char volatil;                 /* Insn sets or needs a volatile memory loc. */
 166   char cc;                      /* Insn sets or needs the condition codes.  */
 167   HARD_REG_SET regs;            /* Which registers are set or needed.  */
 168 };
 169
 170 /* Macro to clear all resources.  */
 171 #define CLEAR_RESOURCE(RES)     \
 172  do { (RES)->memory = (RES)->volatil = (RES)->cc = 0;   \
 173       CLEAR_HARD_REG_SET ((RES)->regs); } while (0)
 174
 175 /* Indicates what resources are required at the beginning of the epilogue.  */
 176 static struct resources start_of_epilogue_needs;
 177
 178 /* Indicates what resources are required at function end.  */
 179 static struct resources end_of_function_needs;
 180
 181 /* Points to the label before the end of the function.  */
 182 static rtx end_of_function_label;
 183
 184 /* This structure is used to record liveness information at the targets or
 185    fallthrough insns of branches.  We will most likely need the information
 186    at targets again, so save them in a hash table rather than recomputing them
 187    each time.  */
 188
 189 struct target_info
 190 {
 191   int uid;                      /* INSN_UID of target.  */
 192   struct target_info *next;     /* Next info for same hash bucket.  */
 193   HARD_REG_SET live_regs;       /* Registers live at target.  */
 194   int block;                    /* Basic block number containing target.  */
 195   int bb_tick;                  /* Generation count of basic block info.  */
 196 };
 197
 198 #define TARGET_HASH_PRIME 257
 199
 200 /* Define the hash table itself.  */
 201 static struct target_info **target_hash_table;
 202
 203 /* For each basic block, we maintain a generation number of its basic
 204    block info, which is updated each time we move an insn from the
 205    target of a jump.  This is the generation number indexed by block
 206    number.  */
 207
 208 static int *bb_ticks;
 209
 210 /* Mapping between INSN_UID's and position in the code since INSN_UID's do
 211    not always monotonically increase.  */
 212 static int *uid_to_ruid;
 213
 214 /* Highest valid index in `uid_to_ruid'.  */
 215 static int max_uid;
 216
 217 static void mark_referenced_resources PROTO((rtx, struct resources *, int));
 218 static void mark_set_resources  PROTO((rtx, struct resources *, int, int));
 219 static int stop_search_p        PROTO((rtx, int));
 220 static int resource_conflicts_p PROTO((struct resources *,
 221                                        struct resources *));
 222 static int insn_references_resource_p PROTO((rtx, struct resources *, int));
 223 static int insn_sets_resources_p PROTO((rtx, struct resources *, int));
 224 static rtx find_end_label       PROTO((void));
 225 static rtx emit_delay_sequence  PROTO((rtx, rtx, int, int));
 226 static rtx add_to_delay_list    PROTO((rtx, rtx));
 227 static void delete_from_delay_slot PROTO((rtx));
 228 static void delete_scheduled_jump PROTO((rtx));
 229 static void note_delay_statistics PROTO((int, int));
 230 static rtx optimize_skip        PROTO((rtx));
 231 static int get_jump_flags PROTO((rtx, rtx));
 232 static int rare_destination PROTO((rtx));
 233 static int mostly_true_jump     PROTO((rtx, rtx));
 234 static rtx get_branch_condition PROTO((rtx, rtx));
 235 static int condition_dominates_p PROTO((rtx, rtx));
 236 static rtx steal_delay_list_from_target PROTO((rtx, rtx, rtx, rtx,
 237                                                struct resources *,
 238                                                struct resources *,
 239                                                struct resources *,
 240                                                int, int *, int *, rtx *));
 241 static rtx steal_delay_list_from_fallthrough PROTO((rtx, rtx, rtx, rtx,
 242                                                     struct resources *,
 243                                                     struct resources *,
 244                                                     struct resources *,
 245                                                     int, int *, int *));
 246 static void try_merge_delay_insns PROTO((rtx, rtx));
 247 static rtx redundant_insn       PROTO((rtx, rtx, rtx));
 248 static int own_thread_p         PROTO((rtx, rtx, int));
 249 static int find_basic_block     PROTO((rtx));
 250 static void update_block        PROTO((rtx, rtx));
 251 static int reorg_redirect_jump PROTO((rtx, rtx));
 252 static void update_reg_dead_notes PROTO((rtx, rtx));
 253 static void update_reg_unused_notes PROTO((rtx, rtx));
 254 static void update_live_status  PROTO((rtx, rtx));
 255 static rtx next_insn_no_annul   PROTO((rtx));
 256 static void mark_target_live_regs PROTO((rtx, struct resources *));
 257 static void fill_simple_delay_slots PROTO((rtx, int));
 258 static rtx fill_slots_from_thread PROTO((rtx, rtx, rtx, rtx, int, int,
 259                                          int, int, int, int *));
 260 static void fill_eager_delay_slots PROTO((rtx));
 261 static void relax_delay_slots   PROTO((rtx));
 262 static void make_return_insns   PROTO((rtx));
 263 static int redirect_with_delay_slots_safe_p PROTO ((rtx, rtx, rtx));
 264 static int redirect_with_delay_list_safe_p PROTO ((rtx, rtx, rtx));
 265 \f
 266 /* Given X, some rtl, and RES, a pointer to a `struct resource', mark
 267    which resources are references by the insn.  If INCLUDE_CALLED_ROUTINE
 268    is TRUE, resources used by the called routine will be included for
 269    CALL_INSNs.  */
 270
 271 static void
 272 mark_referenced_resources (x, res, include_delayed_effects)
 273      register rtx x;
 274      register struct resources *res;
 275      register int include_delayed_effects;
 276 {
 277   register enum rtx_code code = GET_CODE (x);
 278   register int i, j;
 279   register char *format_ptr;
 280
 281   /* Handle leaf items for which we set resource flags.  Also, special-case
 282      CALL, SET and CLOBBER operators.  */
 283   switch (code)
 284     {
 285     case CONST:
 286     case CONST_INT:
 287     case CONST_DOUBLE:
 288     case PC:
 289     case SYMBOL_REF:
 290     case LABEL_REF:
 291       return;
 292
 293     case SUBREG:
 294       if (GET_CODE (SUBREG_REG (x)) != REG)
 295         mark_referenced_resources (SUBREG_REG (x), res, 0);
 296       else
 297         {
 298           int regno = REGNO (SUBREG_REG (x)) + SUBREG_WORD (x);
 299           int last_regno = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
 300           for (i = regno; i < last_regno; i++)
 301             SET_HARD_REG_BIT (res->regs, i);
 302         }
 303       return;
 304
 305     case REG:
 306       for (i = 0; i < HARD_REGNO_NREGS (REGNO (x), GET_MODE (x)); i++)
 307         SET_HARD_REG_BIT (res->regs, REGNO (x) + i);
 308       return;
 309
 310     case MEM:
 311       /* If this memory shouldn't change, it really isn't referencing
 312          memory.  */
 313       if (! RTX_UNCHANGING_P (x))
 314         res->memory = 1;
 315       res->volatil = MEM_VOLATILE_P (x);
 316
 317       /* Mark registers used to access memory.  */
 318       mark_referenced_resources (XEXP (x, 0), res, 0);
 319       return;
 320
 321     case CC0:
 322       res->cc = 1;
 323       return;
 324
 325     case UNSPEC_VOLATILE:
 326     case ASM_INPUT:
 327       /* Traditional asm's are always volatile.  */
 328       res->volatil = 1;
 329       return;
 330
 331     case ASM_OPERANDS:
 332       res->volatil = MEM_VOLATILE_P (x);
 333
 334       /* For all ASM_OPERANDS, we must traverse the vector of input operands.
 335          We can not just fall through here since then we would be confused
 336          by the ASM_INPUT rtx inside ASM_OPERANDS, which do not indicate
 337          traditional asms unlike their normal usage.  */
 338
 339       for (i = 0; i < ASM_OPERANDS_INPUT_LENGTH (x); i++)
 340         mark_referenced_resources (ASM_OPERANDS_INPUT (x, i), res, 0);
 341       return;
 342
 343     case CALL:
 344       /* The first operand will be a (MEM (xxx)) but doesn't really reference
 345          memory.  The second operand may be referenced, though.  */
 346       mark_referenced_resources (XEXP (XEXP (x, 0), 0), res, 0);
 347       mark_referenced_resources (XEXP (x, 1), res, 0);
 348       return;
 349
 350     case SET:
 351       /* Usually, the first operand of SET is set, not referenced.  But
 352          registers used to access memory are referenced.  SET_DEST is
 353          also referenced if it is a ZERO_EXTRACT or SIGN_EXTRACT.  */
 354
 355       mark_referenced_resources (SET_SRC (x), res, 0);
 356
 357       x = SET_DEST (x);
 358       if (GET_CODE (x) == SIGN_EXTRACT || GET_CODE (x) == ZERO_EXTRACT)
 359         mark_referenced_resources (x, res, 0);
 360       else if (GET_CODE (x) == SUBREG)
 361         x = SUBREG_REG (x);
 362       if (GET_CODE (x) == MEM)
 363         mark_referenced_resources (XEXP (x, 0), res, 0);
 364       return;
 365
 366     case CLOBBER:
 367       return;
 368
 369     case CALL_INSN:
 370       if (include_delayed_effects)
 371         {
 372           /* A CALL references memory, the frame pointer if it exists, the
 373              stack pointer, any global registers and any registers given in
 374              USE insns immediately in front of the CALL.
 375
 376              However, we may have moved some of the parameter loading insns
 377              into the delay slot of this CALL.  If so, the USE's for them
 378              don't count and should be skipped.  */
 379           rtx insn = PREV_INSN (x);
 380           rtx sequence = 0;
 381           int seq_size = 0;
 382           int i;
 383
 384           /* If we are part of a delay slot sequence, point at the SEQUENCE. */
 385           if (NEXT_INSN (insn) != x)
 386             {
 387               sequence = PATTERN (NEXT_INSN (insn));
 388               seq_size = XVECLEN (sequence, 0);
 389               if (GET_CODE (sequence) != SEQUENCE)
 390                 abort ();
 391             }
 392
 393           res->memory = 1;
 394           SET_HARD_REG_BIT (res->regs, STACK_POINTER_REGNUM);
 395           if (frame_pointer_needed)
 396             {
 397               SET_HARD_REG_BIT (res->regs, FRAME_POINTER_REGNUM);
 398 #if FRAME_POINTER_REGNUM != HARD_FRAME_POINTER_REGNUM
 399               SET_HARD_REG_BIT (res->regs, HARD_FRAME_POINTER_REGNUM);
 400 #endif
 401             }
 402
 403           for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
 404             if (global_regs[i])
 405               SET_HARD_REG_BIT (res->regs, i);
 406
 407           {
 408             rtx link;
 409
 410             for (link = CALL_INSN_FUNCTION_USAGE (x);
 411                  link;
 412                  link = XEXP (link, 1))
 413               if (GET_CODE (XEXP (link, 0)) == USE)
 414                 {
 415                   for (i = 1; i < seq_size; i++)
 416                     {
 417                       rtx slot_pat = PATTERN (XVECEXP (sequence, 0, i));
 418                       if (GET_CODE (slot_pat) == SET
 419                           && rtx_equal_p (SET_DEST (slot_pat),
 420                                           SET_DEST (XEXP (link, 0))))
 421                         break;
 422                     }
 423                   if (i >= seq_size)
 424                     mark_referenced_resources (SET_DEST (XEXP (link, 0)),
 425                                                res, 0);
 426                 }
 427           }
 428         }
 429
 430       /* ... fall through to other INSN processing ... */
 431
 432     case INSN:
 433     case JUMP_INSN:
 434
 435 #ifdef INSN_REFERENCES_ARE_DELAYED
 436       if (! include_delayed_effects
 437           && INSN_REFERENCES_ARE_DELAYED (x))
 438         return;
 439 #endif
 440
 441       /* No special processing, just speed up.  */
 442       mark_referenced_resources (PATTERN (x), res, include_delayed_effects);
 443       return;
 444     }
 445
 446   /* Process each sub-expression and flag what it needs.  */
 447   format_ptr = GET_RTX_FORMAT (code);
 448   for (i = 0; i < GET_RTX_LENGTH (code); i++)
 449     switch (*format_ptr++)
 450       {
 451       case 'e':
 452         mark_referenced_resources (XEXP (x, i), res, include_delayed_effects);
 453         break;
 454
 455       case 'E':
 456         for (j = 0; j < XVECLEN (x, i); j++)
 457           mark_referenced_resources (XVECEXP (x, i, j), res,
 458                                      include_delayed_effects);
 459         break;
 460       }
 461 }
 462 \f
 463 /* Given X, a part of an insn, and a pointer to a `struct resource', RES,
 464    indicate which resources are modified by the insn. If INCLUDE_CALLED_ROUTINE
 465    is nonzero, also mark resources potentially set by the called routine.
 466
 467    If IN_DEST is nonzero, it means we are inside a SET.  Otherwise,
 468    objects are being referenced instead of set.
 469
 470    We never mark the insn as modifying the condition code unless it explicitly
 471    SETs CC0 even though this is not totally correct.  The reason for this is
 472    that we require a SET of CC0 to immediately precede the reference to CC0.
 473    So if some other insn sets CC0 as a side-effect, we know it cannot affect
 474    our computation and thus may be placed in a delay slot.   */
 475
 476 static void
 477 mark_set_resources (x, res, in_dest, include_delayed_effects)
 478      register rtx x;
 479      register struct resources *res;
 480      int in_dest;
 481      int include_delayed_effects;
 482 {
 483   register enum rtx_code code;
 484   register int i, j;
 485   register char *format_ptr;
 486
 487  restart:
 488
 489   code = GET_CODE (x);
 490
 491   switch (code)
 492     {
 493     case NOTE:
 494     case BARRIER:
 495     case CODE_LABEL:
 496     case USE:
 497     case CONST_INT:
 498     case CONST_DOUBLE:
 499     case LABEL_REF:
 500     case SYMBOL_REF:
 501     case CONST:
 502     case PC:
 503       /* These don't set any resources.  */
 504       return;
 505
 506     case CC0:
 507       if (in_dest)
 508         res->cc = 1;
 509       return;
 510
 511     case CALL_INSN:
 512       /* Called routine modifies the condition code, memory, any registers
 513          that aren't saved across calls, global registers and anything
 514          explicitly CLOBBERed immediately after the CALL_INSN.  */
 515
 516       if (include_delayed_effects)
 517         {
 518           rtx next = NEXT_INSN (x);
 519           rtx prev = PREV_INSN (x);
 520           rtx link;
 521
 522           res->cc = res->memory = 1;
 523           for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
 524             if (call_used_regs[i] || global_regs[i])
 525               SET_HARD_REG_BIT (res->regs, i);
 526
 527           /* If X is part of a delay slot sequence, then NEXT should be
 528              the first insn after the sequence.  */
 529           if (NEXT_INSN (prev) != x)
 530             next = NEXT_INSN (NEXT_INSN (prev));
 531
 532           for (link = CALL_INSN_FUNCTION_USAGE (x);
 533                link; link = XEXP (link, 1))
 534             if (GET_CODE (XEXP (link, 0)) == CLOBBER)
 535               mark_set_resources (SET_DEST (XEXP (link, 0)), res, 1, 0);
 536
 537           /* Check for a NOTE_INSN_SETJMP.  If it exists, then we must
 538              assume that this call can clobber any register.  */
 539           if (next && GET_CODE (next) == NOTE
 540               && NOTE_LINE_NUMBER (next) == NOTE_INSN_SETJMP)
 541             SET_HARD_REG_SET (res->regs);
 542         }
 543
 544       /* ... and also what it's RTL says it modifies, if anything.  */
 545
 546     case JUMP_INSN:
 547     case INSN:
 548
 549         /* An insn consisting of just a CLOBBER (or USE) is just for flow
 550            and doesn't actually do anything, so we ignore it.  */
 551
 552 #ifdef INSN_SETS_ARE_DELAYED
 553       if (! include_delayed_effects
 554           && INSN_SETS_ARE_DELAYED (x))
 555         return;
 556 #endif
 557
 558       x = PATTERN (x);
 559       if (GET_CODE (x) != USE && GET_CODE (x) != CLOBBER)
 560         goto restart;
 561       return;
 562
 563     case SET:
 564       /* If the source of a SET is a CALL, this is actually done by
 565          the called routine.  So only include it if we are to include the
 566          effects of the calling routine.  */
 567
 568       mark_set_resources (SET_DEST (x), res,
 569                           (include_delayed_effects
 570                            || GET_CODE (SET_SRC (x)) != CALL),
 571                           0);
 572
 573       mark_set_resources (SET_SRC (x), res, 0, 0);
 574       return;
 575
 576     case CLOBBER:
 577       mark_set_resources (XEXP (x, 0), res, 1, 0);
 578       return;
 579
 580     case SEQUENCE:
 581       for (i = 0; i < XVECLEN (x, 0); i++)
 582         if (! (INSN_ANNULLED_BRANCH_P (XVECEXP (x, 0, 0))
 583                && INSN_FROM_TARGET_P (XVECEXP (x, 0, i))))
 584           mark_set_resources (XVECEXP (x, 0, i), res, 0,
 585                               include_delayed_effects);
 586       return;
 587
 588     case POST_INC:
 589     case PRE_INC:
 590     case POST_DEC:
 591     case PRE_DEC:
 592       mark_set_resources (XEXP (x, 0), res, 1, 0);
 593       return;
 594
 595     case ZERO_EXTRACT:
 596       mark_set_resources (XEXP (x, 0), res, in_dest, 0);
 597       mark_set_resources (XEXP (x, 1), res, 0, 0);
 598       mark_set_resources (XEXP (x, 2), res, 0, 0);
 599       return;
 600
 601     case MEM:
 602       if (in_dest)
 603         {
 604           res->memory = 1;
 605           res->volatil = MEM_VOLATILE_P (x);
 606         }
 607
 608       mark_set_resources (XEXP (x, 0), res, 0, 0);
 609       return;
 610
 611     case SUBREG:
 612       if (in_dest)
 613         {
 614           if (GET_CODE (SUBREG_REG (x)) != REG)
 615             mark_set_resources (SUBREG_REG (x), res,
 616                                 in_dest, include_delayed_effects);
 617           else
 618             {
 619               int regno = REGNO (SUBREG_REG (x)) + SUBREG_WORD (x);
 620               int last_regno = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
 621               for (i = regno; i < last_regno; i++)
 622                 SET_HARD_REG_BIT (res->regs, i);
 623             }
 624         }
 625       return;
 626
 627     case REG:
 628       if (in_dest)
 629         for (i = 0; i < HARD_REGNO_NREGS (REGNO (x), GET_MODE (x)); i++)
 630           SET_HARD_REG_BIT (res->regs, REGNO (x) + i);
 631       return;
 632     }
 633
 634   /* Process each sub-expression and flag what it needs.  */
 635   format_ptr = GET_RTX_FORMAT (code);
 636   for (i = 0; i < GET_RTX_LENGTH (code); i++)
 637     switch (*format_ptr++)
 638       {
 639       case 'e':
 640         mark_set_resources (XEXP (x, i), res, in_dest, include_delayed_effects);
 641         break;
 642
 643       case 'E':
 644         for (j = 0; j < XVECLEN (x, i); j++)
 645           mark_set_resources (XVECEXP (x, i, j), res, in_dest,
 646                               include_delayed_effects);
 647         break;
 648       }
 649 }
 650 \f
 651 /* Return TRUE if this insn should stop the search for insn to fill delay
 652    slots.  LABELS_P indicates that labels should terminate the search.
 653    In all cases, jumps terminate the search.  */
 654
 655 static int
 656 stop_search_p (insn, labels_p)
 657      rtx insn;
 658      int labels_p;
 659 {
 660   if (insn == 0)
 661     return 1;
 662
 663   switch (GET_CODE (insn))
 664     {
 665     case NOTE:
 666     case CALL_INSN:
 667       return 0;
 668
 669     case CODE_LABEL:
 670       return labels_p;
 671
 672     case JUMP_INSN:
 673     case BARRIER:
 674       return 1;
 675
 676     case INSN:
 677       /* OK unless it contains a delay slot or is an `asm' insn of some type.
 678          We don't know anything about these.  */
 679       return (GET_CODE (PATTERN (insn)) == SEQUENCE
 680               || GET_CODE (PATTERN (insn)) == ASM_INPUT
 681               || asm_noperands (PATTERN (insn)) >= 0);
 682
 683     default:
 684       abort ();
 685     }
 686 }
 687 \f
 688 /* Return TRUE if any resources are marked in both RES1 and RES2 or if either
 689    resource set contains a volatile memory reference.  Otherwise, return FALSE.  */
 690
 691 static int
 692 resource_conflicts_p (res1, res2)
 693      struct resources *res1, *res2;
 694 {
 695   if ((res1->cc && res2->cc) || (res1->memory && res2->memory)
 696       || res1->volatil || res2->volatil)
 697     return 1;
 698
 699 #ifdef HARD_REG_SET
 700   return (res1->regs & res2->regs) != HARD_CONST (0);
 701 #else
 702   {
 703     int i;
 704
 705     for (i = 0; i < HARD_REG_SET_LONGS; i++)
 706       if ((res1->regs[i] & res2->regs[i]) != 0)
 707         return 1;
 708     return 0;
 709   }
 710 #endif
 711 }
 712
 713 /* Return TRUE if any resource marked in RES, a `struct resources', is
 714    referenced by INSN.  If INCLUDE_CALLED_ROUTINE is set, return if the called
 715    routine is using those resources.
 716
 717    We compute this by computing all the resources referenced by INSN and
 718    seeing if this conflicts with RES.  It might be faster to directly check
 719    ourselves, and this is the way it used to work, but it means duplicating
 720    a large block of complex code.  */
 721
 722 static int
 723 insn_references_resource_p (insn, res, include_delayed_effects)
 724      register rtx insn;
 725      register struct resources *res;
 726      int include_delayed_effects;
 727 {
 728   struct resources insn_res;
 729
 730   CLEAR_RESOURCE (&insn_res);
 731   mark_referenced_resources (insn, &insn_res, include_delayed_effects);
 732   return resource_conflicts_p (&insn_res, res);
 733 }
 734
 735 /* Return TRUE if INSN modifies resources that are marked in RES.
 736    INCLUDE_CALLED_ROUTINE is set if the actions of that routine should be
 737    included.   CC0 is only modified if it is explicitly set; see comments
 738    in front of mark_set_resources for details.  */
 739
 740 static int
 741 insn_sets_resource_p (insn, res, include_delayed_effects)
 742      register rtx insn;
 743      register struct resources *res;
 744      int include_delayed_effects;
 745 {
 746   struct resources insn_sets;
 747
 748   CLEAR_RESOURCE (&insn_sets);
 749   mark_set_resources (insn, &insn_sets, 0, include_delayed_effects);
 750   return resource_conflicts_p (&insn_sets, res);
 751 }
 752 \f
 753 /* Find a label at the end of the function or before a RETURN.  If there is
 754    none, make one.  */
 755
 756 static rtx
 757 find_end_label ()
 758 {
 759   rtx insn;
 760
 761   /* If we found one previously, return it.  */
 762   if (end_of_function_label)
 763     return end_of_function_label;
 764
 765   /* Otherwise, see if there is a label at the end of the function.  If there
 766      is, it must be that RETURN insns aren't needed, so that is our return
 767      label and we don't have to do anything else.  */
 768
 769   insn = get_last_insn ();
 770   while (GET_CODE (insn) == NOTE
 771          || (GET_CODE (insn) == INSN
 772              && (GET_CODE (PATTERN (insn)) == USE
 773                  || GET_CODE (PATTERN (insn)) == CLOBBER)))
 774     insn = PREV_INSN (insn);
 775
 776   /* When a target threads its epilogue we might already have a
 777      suitable return insn.  If so put a label before it for the
 778      end_of_function_label.  */
 779   if (GET_CODE (insn) == BARRIER
 780       && GET_CODE (PREV_INSN (insn)) == JUMP_INSN
 781       && GET_CODE (PATTERN (PREV_INSN (insn))) == RETURN)
 782     {
 783       rtx temp = PREV_INSN (PREV_INSN (insn));
 784       end_of_function_label = gen_label_rtx ();
 785       LABEL_NUSES (end_of_function_label) = 0;
 786
 787       /* Put the label before an USE insns that may proceed the RETURN insn. */
 788       while (GET_CODE (temp) == USE)
 789         temp = PREV_INSN (temp);
 790
 791       emit_label_after (end_of_function_label, temp);
 792     }
 793
 794   else if (GET_CODE (insn) == CODE_LABEL)
 795     end_of_function_label = insn;
 796   else
 797     {
 798       /* Otherwise, make a new label and emit a RETURN and BARRIER,
 799          if needed.  */
 800       end_of_function_label = gen_label_rtx ();
 801       LABEL_NUSES (end_of_function_label) = 0;
 802       emit_label (end_of_function_label);
 803 #ifdef HAVE_return
 804       if (HAVE_return)
 805         {
 806           /* The return we make may have delay slots too.  */
 807           rtx insn = gen_return ();
 808           insn = emit_jump_insn (insn);
 809           emit_barrier ();
 810           if (num_delay_slots (insn) > 0)
 811             obstack_ptr_grow (&unfilled_slots_obstack, insn);
 812         }
 813 #endif
 814     }
 815
 816   /* Show one additional use for this label so it won't go away until
 817      we are done.  */
 818   ++LABEL_NUSES (end_of_function_label);
 819
 820   return end_of_function_label;
 821 }
 822 \f
 823 /* Put INSN and LIST together in a SEQUENCE rtx of LENGTH, and replace
 824    the pattern of INSN with the SEQUENCE.
 825
 826    Chain the insns so that NEXT_INSN of each insn in the sequence points to
 827    the next and NEXT_INSN of the last insn in the sequence points to
 828    the first insn after the sequence.  Similarly for PREV_INSN.  This makes
 829    it easier to scan all insns.
 830
 831    Returns the SEQUENCE that replaces INSN.  */
 832
 833 static rtx
 834 emit_delay_sequence (insn, list, length, avail)
 835      rtx insn;
 836      rtx list;
 837      int length;
 838      int avail;
 839 {
 840   register int i = 1;
 841   register rtx li;
 842   int had_barrier = 0;
 843
 844   /* Allocate the the rtvec to hold the insns and the SEQUENCE. */
 845   rtvec seqv = rtvec_alloc (length + 1);
 846   rtx seq = gen_rtx (SEQUENCE, VOIDmode, seqv);
 847   rtx seq_insn = make_insn_raw (seq);
 848   rtx first = get_insns ();
 849   rtx last = get_last_insn ();
 850
 851   /* Make a copy of the insn having delay slots. */
 852   rtx delay_insn = copy_rtx (insn);
 853
 854   /* If INSN is followed by a BARRIER, delete the BARRIER since it will only
 855      confuse further processing.  Update LAST in case it was the last insn.
 856      We will put the BARRIER back in later.  */
 857   if (NEXT_INSN (insn) && GET_CODE (NEXT_INSN (insn)) == BARRIER)
 858     {
 859       delete_insn (NEXT_INSN (insn));
 860       last = get_last_insn ();
 861       had_barrier = 1;
 862     }
 863
 864   /* Splice our SEQUENCE into the insn stream where INSN used to be.  */
 865   NEXT_INSN (seq_insn) = NEXT_INSN (insn);
 866   PREV_INSN (seq_insn) = PREV_INSN (insn);
 867
 868   if (insn == last)
 869     set_new_first_and_last_insn (first, seq_insn);
 870   else
 871     PREV_INSN (NEXT_INSN (seq_insn)) = seq_insn;
 872
 873   if (insn == first)
 874     set_new_first_and_last_insn (seq_insn, last);
 875   else
 876     NEXT_INSN (PREV_INSN (seq_insn)) = seq_insn;
 877
 878   /* Build our SEQUENCE and rebuild the insn chain.  */
 879   XVECEXP (seq, 0, 0) = delay_insn;
 880   INSN_DELETED_P (delay_insn) = 0;
 881   PREV_INSN (delay_insn) = PREV_INSN (seq_insn);
 882
 883   for (li = list; li; li = XEXP (li, 1), i++)
 884     {
 885       rtx tem = XEXP (li, 0);
 886       rtx note;
 887
 888       /* Show that this copy of the insn isn't deleted.  */
 889       INSN_DELETED_P (tem) = 0;
 890
 891       XVECEXP (seq, 0, i) = tem;
 892       PREV_INSN (tem) = XVECEXP (seq, 0, i - 1);
 893       NEXT_INSN (XVECEXP (seq, 0, i - 1)) = tem;
 894
 895       /* Remove any REG_DEAD notes because we can't rely on them now
 896          that the insn has been moved.  */
 897       for (note = REG_NOTES (tem); note; note = XEXP (note, 1))
 898         if (REG_NOTE_KIND (note) == REG_DEAD)
 899           XEXP (note, 0) = const0_rtx;
 900     }
 901
 902   NEXT_INSN (XVECEXP (seq, 0, length)) = NEXT_INSN (seq_insn);
 903
 904   /* If the previous insn is a SEQUENCE, update the NEXT_INSN pointer on the
 905      last insn in that SEQUENCE to point to us.  Similarly for the first
 906      insn in the following insn if it is a SEQUENCE.  */
 907
 908   if (PREV_INSN (seq_insn) && GET_CODE (PREV_INSN (seq_insn)) == INSN
 909       && GET_CODE (PATTERN (PREV_INSN (seq_insn))) == SEQUENCE)
 910     NEXT_INSN (XVECEXP (PATTERN (PREV_INSN (seq_insn)), 0,
 911                         XVECLEN (PATTERN (PREV_INSN (seq_insn)), 0) - 1))
 912       = seq_insn;
 913
 914   if (NEXT_INSN (seq_insn) && GET_CODE (NEXT_INSN (seq_insn)) == INSN
 915       && GET_CODE (PATTERN (NEXT_INSN (seq_insn))) == SEQUENCE)
 916     PREV_INSN (XVECEXP (PATTERN (NEXT_INSN (seq_insn)), 0, 0)) = seq_insn;
 917
 918   /* If there used to be a BARRIER, put it back.  */
 919   if (had_barrier)
 920     emit_barrier_after (seq_insn);
 921
 922   if (i != length + 1)
 923     abort ();
 924
 925   return seq_insn;
 926 }
 927
 928 /* Add INSN to DELAY_LIST and return the head of the new list.  The list must
 929    be in the order in which the insns are to be executed.  */
 930
 931 static rtx
 932 add_to_delay_list (insn, delay_list)
 933      rtx insn;
 934      rtx delay_list;
 935 {
 936   /* If we have an empty list, just make a new list element.  If
 937      INSN has it's block number recorded, clear it since we may
 938      be moving the insn to a new block.  */
 939
 940   if (delay_list == 0)
 941     {
 942       struct target_info *tinfo;
 943
 944       for (tinfo = target_hash_table[INSN_UID (insn) % TARGET_HASH_PRIME];
 945            tinfo; tinfo = tinfo->next)
 946         if (tinfo->uid == INSN_UID (insn))
 947           break;
 948
 949       if (tinfo)
 950         tinfo->block = -1;
 951
 952       return gen_rtx (INSN_LIST, VOIDmode, insn, NULL_RTX);
 953     }
 954
 955   /* Otherwise this must be an INSN_LIST.  Add INSN to the end of the
 956      list.  */
 957   XEXP (delay_list, 1) = add_to_delay_list (insn, XEXP (delay_list, 1));
 958
 959   return delay_list;
 960 }
 961 \f
 962 /* Delete INSN from the the delay slot of the insn that it is in.  This may
 963    produce an insn without anything in its delay slots.  */
 964
 965 static void
 966 delete_from_delay_slot (insn)
 967      rtx insn;
 968 {
 969   rtx trial, seq_insn, seq, prev;
 970   rtx delay_list = 0;
 971   int i;
 972
 973   /* We first must find the insn containing the SEQUENCE with INSN in its
 974      delay slot.  Do this by finding an insn, TRIAL, where
 975      PREV_INSN (NEXT_INSN (TRIAL)) != TRIAL.  */
 976
 977   for (trial = insn;
 978        PREV_INSN (NEXT_INSN (trial)) == trial;
 979        trial = NEXT_INSN (trial))
 980     ;
 981
 982   seq_insn = PREV_INSN (NEXT_INSN (trial));
 983   seq = PATTERN (seq_insn);
 984
 985   /* Create a delay list consisting of all the insns other than the one
 986      we are deleting (unless we were the only one).  */
 987   if (XVECLEN (seq, 0) > 2)
 988     for (i = 1; i < XVECLEN (seq, 0); i++)
 989       if (XVECEXP (seq, 0, i) != insn)
 990         delay_list = add_to_delay_list (XVECEXP (seq, 0, i), delay_list);
 991
 992   /* Delete the old SEQUENCE, re-emit the insn that used to have the delay
 993      list, and rebuild the delay list if non-empty.  */
 994   prev = PREV_INSN (seq_insn);
 995   trial = XVECEXP (seq, 0, 0);
 996   delete_insn (seq_insn);
 997   add_insn_after (trial, prev);
 998
 999   if (GET_CODE (trial) == JUMP_INSN
1000       && (simplejump_p (trial) || GET_CODE (PATTERN (trial)) == RETURN))
1001     emit_barrier_after (trial);
1002
1003   /* If there are any delay insns, remit them.  Otherwise clear the
1004      annul flag.  */
1005   if (delay_list)
1006     trial = emit_delay_sequence (trial, delay_list, XVECLEN (seq, 0) - 2, 0);
1007   else
1008     INSN_ANNULLED_BRANCH_P (trial) = 0;
1009
1010   INSN_FROM_TARGET_P (insn) = 0;
1011
1012   /* Show we need to fill this insn again.  */
1013   obstack_ptr_grow (&unfilled_slots_obstack, trial);
1014 }
1015 \f
1016 /* Delete INSN, a JUMP_INSN.  If it is a conditional jump, we must track down
1017    the insn that sets CC0 for it and delete it too.  */
1018
1019 static void
1020 delete_scheduled_jump (insn)
1021      rtx insn;
1022 {
1023   /* Delete the insn that sets cc0 for us.  On machines without cc0, we could
1024      delete the insn that sets the condition code, but it is hard to find it.
1025      Since this case is rare anyway, don't bother trying; there would likely
1026      be other insns that became dead anyway, which we wouldn't know to
1027      delete.  */
1028
1029 #ifdef HAVE_cc0
1030   if (reg_mentioned_p (cc0_rtx, insn))
1031     {
1032       rtx note = find_reg_note (insn, REG_CC_SETTER, NULL_RTX);
1033
1034       /* If a reg-note was found, it points to an insn to set CC0.  This
1035          insn is in the delay list of some other insn.  So delete it from
1036          the delay list it was in.  */
1037       if (note)
1038         {
1039           if (! FIND_REG_INC_NOTE (XEXP (note, 0), NULL_RTX)
1040               && sets_cc0_p (PATTERN (XEXP (note, 0))) == 1)
1041             delete_from_delay_slot (XEXP (note, 0));
1042         }
1043       else
1044         {
1045           /* The insn setting CC0 is our previous insn, but it may be in
1046              a delay slot.  It will be the last insn in the delay slot, if
1047              it is.  */
1048           rtx trial = previous_insn (insn);
1049           if (GET_CODE (trial) == NOTE)
1050             trial = prev_nonnote_insn (trial);
1051           if (sets_cc0_p (PATTERN (trial)) != 1
1052               || FIND_REG_INC_NOTE (trial, 0))
1053             return;
1054           if (PREV_INSN (NEXT_INSN (trial)) == trial)
1055             delete_insn (trial);
1056           else
1057             delete_from_delay_slot (trial);
1058         }
1059     }
1060 #endif
1061
1062   delete_insn (insn);
1063 }
1064 \f
1065 /* Counters for delay-slot filling.  */
1066
1067 #define NUM_REORG_FUNCTIONS 2
1068 #define MAX_DELAY_HISTOGRAM 3
1069 #define MAX_REORG_PASSES 2
1070
1071 static int num_insns_needing_delays[NUM_REORG_FUNCTIONS][MAX_REORG_PASSES];
1072
1073 static int num_filled_delays[NUM_REORG_FUNCTIONS][MAX_DELAY_HISTOGRAM+1][MAX_REORG_PASSES];
1074
1075 static int reorg_pass_number;
1076
1077 static void
1078 note_delay_statistics (slots_filled, index)
1079      int slots_filled, index;
1080 {
1081   num_insns_needing_delays[index][reorg_pass_number]++;
1082   if (slots_filled > MAX_DELAY_HISTOGRAM)
1083     slots_filled = MAX_DELAY_HISTOGRAM;
1084   num_filled_delays[index][slots_filled][reorg_pass_number]++;
1085 }
1086 \f
1087 #if defined(ANNUL_IFFALSE_SLOTS) || defined(ANNUL_IFTRUE_SLOTS)
1088
1089 /* Optimize the following cases:
1090
1091    1.  When a conditional branch skips over only one instruction,
1092        use an annulling branch and put that insn in the delay slot.
1093        Use either a branch that annuls when the condition if true or
1094        invert the test with a branch that annuls when the condition is
1095        false.  This saves insns, since otherwise we must copy an insn
1096        from the L1 target.
1097
1098         (orig)           (skip)         (otherwise)
1099         Bcc.n L1        Bcc',a L1       Bcc,a L1'
1100         insn            insn            insn2
1101       L1:             L1:             L1:
1102         insn2           insn2           insn2
1103         insn3           insn3         L1':
1104                                         insn3
1105
1106    2.  When a conditional branch skips over only one instruction,
1107        and after that, it unconditionally branches somewhere else,
1108        perform the similar optimization. This saves executing the
1109        second branch in the case where the inverted condition is true.
1110
1111         Bcc.n L1        Bcc',a L2
1112         insn            insn
1113       L1:             L1:
1114         Bra L2          Bra L2
1115
1116    INSN is a JUMP_INSN.
1117
1118    This should be expanded to skip over N insns, where N is the number
1119    of delay slots required.  */
1120
1121 static rtx
1122 optimize_skip (insn)
1123      register rtx insn;
1124 {
1125   register rtx trial = next_nonnote_insn (insn);
1126   rtx next_trial = next_active_insn (trial);
1127   rtx delay_list = 0;
1128   rtx target_label;
1129   int flags;
1130
1131   flags = get_jump_flags (insn, JUMP_LABEL (insn));
1132
1133   if (trial == 0
1134       || GET_CODE (trial) != INSN
1135       || GET_CODE (PATTERN (trial)) == SEQUENCE
1136       || recog_memoized (trial) < 0
1137       || (! eligible_for_annul_false (insn, 0, trial, flags)
1138           && ! eligible_for_annul_true (insn, 0, trial, flags)))
1139     return 0;
1140
1141   /* There are two cases where we are just executing one insn (we assume
1142      here that a branch requires only one insn; this should be generalized
1143      at some point):  Where the branch goes around a single insn or where
1144      we have one insn followed by a branch to the same label we branch to.
1145      In both of these cases, inverting the jump and annulling the delay
1146      slot give the same effect in fewer insns.  */
1147   if ((next_trial == next_active_insn (JUMP_LABEL (insn)))
1148       || (next_trial != 0
1149           && GET_CODE (next_trial) == JUMP_INSN
1150           && JUMP_LABEL (insn) == JUMP_LABEL (next_trial)
1151           && (simplejump_p (next_trial)
1152               || GET_CODE (PATTERN (next_trial)) == RETURN)))
1153     {
1154       if (eligible_for_annul_false (insn, 0, trial, flags))
1155         {
1156           if (invert_jump (insn, JUMP_LABEL (insn)))
1157             INSN_FROM_TARGET_P (trial) = 1;
1158           else if (! eligible_for_annul_true (insn, 0, trial, flags))
1159             return 0;
1160         }
1161
1162       delay_list = add_to_delay_list (trial, NULL_RTX);
1163       next_trial = next_active_insn (trial);
1164       update_block (trial, trial);
1165       delete_insn (trial);
1166
1167       /* Also, if we are targeting an unconditional
1168          branch, thread our jump to the target of that branch.  Don't
1169          change this into a RETURN here, because it may not accept what
1170          we have in the delay slot.  We'll fix this up later.  */
1171       if (next_trial && GET_CODE (next_trial) == JUMP_INSN
1172           && (simplejump_p (next_trial)
1173               || GET_CODE (PATTERN (next_trial)) == RETURN))
1174         {
1175           target_label = JUMP_LABEL (next_trial);
1176           if (target_label == 0)
1177             target_label = find_end_label ();
1178
1179           /* Recompute the flags based on TARGET_LABEL since threading
1180              the jump to TARGET_LABEL may change the direction of the
1181              jump (which may change the circumstances in which the
1182              delay slot is nullified).  */
1183           flags = get_jump_flags (insn, target_label);
1184           if (eligible_for_annul_true (insn, 0, trial, flags))
1185             reorg_redirect_jump (insn, target_label);
1186         }
1187
1188       INSN_ANNULLED_BRANCH_P (insn) = 1;
1189     }
1190
1191   return delay_list;
1192 }
1193 #endif
1194 \f
1195
1196 /*  Encode and return branch direction and prediction information for
1197     INSN assuming it will jump to LABEL.
1198
1199     Non conditional branches return no direction information and
1200     are predicted as very likely taken.  */
1201 static int
1202 get_jump_flags (insn, label)
1203      rtx insn, label;
1204 {
1205   int flags;
1206
1207   /* get_jump_flags can be passed any insn with delay slots, these may
1208      be INSNs, CALL_INSNs, or JUMP_INSNs.  Only JUMP_INSNs have branch
1209      direction information, and only if they are conditional jumps.
1210
1211      If LABEL is zero, then there is no way to determine the branch
1212      direction.  */
1213   if (GET_CODE (insn) == JUMP_INSN
1214       && (condjump_p (insn) || condjump_in_parallel_p (insn))
1215       && INSN_UID (insn) <= max_uid
1216       && label != 0
1217       && INSN_UID (label) <= max_uid)
1218     flags
1219       = (uid_to_ruid[INSN_UID (label)] > uid_to_ruid[INSN_UID (insn)])
1220          ? ATTR_FLAG_forward : ATTR_FLAG_backward;
1221   /* No valid direction information.  */
1222   else
1223     flags = 0;
1224
1225   /* If insn is a conditional branch call mostly_true_jump to get
1226      determine the branch prediction.
1227
1228      Non conditional branches are predicted as very likely taken.  */
1229   if (GET_CODE (insn) == JUMP_INSN
1230       && (condjump_p (insn) || condjump_in_parallel_p (insn)))
1231     {
1232       int prediction;
1233
1234       prediction = mostly_true_jump (insn, get_branch_condition (insn, label));
1235       switch (prediction)
1236         {
1237           case 2:
1238             flags |= (ATTR_FLAG_very_likely | ATTR_FLAG_likely);
1239             break;
1240           case 1:
1241             flags |= ATTR_FLAG_likely;
1242             break;
1243           case 0:
1244             flags |= ATTR_FLAG_unlikely;
1245             break;
1246           case -1:
1247             flags |= (ATTR_FLAG_very_unlikely | ATTR_FLAG_unlikely);
1248             break;
1249
1250           default:
1251             abort();
1252         }
1253     }
1254   else
1255     flags |= (ATTR_FLAG_very_likely | ATTR_FLAG_likely);
1256
1257   return flags;
1258 }
1259
1260 /* Return 1 if INSN is a destination that will be branched to rarely (the
1261    return point of a function); return 2 if DEST will be branched to very
1262    rarely (a call to a function that doesn't return).  Otherwise,
1263    return 0.  */
1264
1265 static int
1266 rare_destination (insn)
1267      rtx insn;
1268 {
1269   int jump_count = 0;
1270   rtx next;
1271
1272   for (; insn; insn = next)
1273     {
1274       if (GET_CODE (insn) == INSN && GET_CODE (PATTERN (insn)) == SEQUENCE)
1275         insn = XVECEXP (PATTERN (insn), 0, 0);
1276
1277       next = NEXT_INSN (insn);
1278
1279       switch (GET_CODE (insn))
1280         {
1281         case CODE_LABEL:
1282           return 0;
1283         case BARRIER:
1284           /* A BARRIER can either be after a JUMP_INSN or a CALL_INSN.  We
1285              don't scan past JUMP_INSNs, so any barrier we find here must
1286              have been after a CALL_INSN and hence mean the call doesn't
1287              return.  */
1288           return 2;
1289         case JUMP_INSN:
1290           if (GET_CODE (PATTERN (insn)) == RETURN)
1291             return 1;
1292           else if (simplejump_p (insn)
1293                    && jump_count++ < 10)
1294             next = JUMP_LABEL (insn);
1295           else
1296             return 0;
1297         }
1298     }
1299
1300   /* If we got here it means we hit the end of the function.  So this
1301      is an unlikely destination.  */
1302
1303   return 1;
1304 }
1305
1306 /* Return truth value of the statement that this branch
1307    is mostly taken.  If we think that the branch is extremely likely
1308    to be taken, we return 2.  If the branch is slightly more likely to be
1309    taken, return 1.  If the branch is slightly less likely to be taken,
1310    return 0 and if the branch is highly unlikely to be taken, return -1.
1311
1312    CONDITION, if non-zero, is the condition that JUMP_INSN is testing.  */
1313
1314 static int
1315 mostly_true_jump (jump_insn, condition)
1316      rtx jump_insn, condition;
1317 {
1318   rtx target_label = JUMP_LABEL (jump_insn);
1319   rtx insn;
1320   int rare_dest = rare_destination (target_label);
1321   int rare_fallthrough = rare_destination (NEXT_INSN (jump_insn));
1322
1323   /* If this is a branch outside a loop, it is highly unlikely.  */
1324   if (GET_CODE (PATTERN (jump_insn)) == SET
1325       && GET_CODE (SET_SRC (PATTERN (jump_insn))) == IF_THEN_ELSE
1326       && ((GET_CODE (XEXP (SET_SRC (PATTERN (jump_insn)), 1)) == LABEL_REF
1327            && LABEL_OUTSIDE_LOOP_P (XEXP (SET_SRC (PATTERN (jump_insn)), 1)))
1328           || (GET_CODE (XEXP (SET_SRC (PATTERN (jump_insn)), 2)) == LABEL_REF
1329               && LABEL_OUTSIDE_LOOP_P (XEXP (SET_SRC (PATTERN (jump_insn)), 2)))))
1330     return -1;
1331
1332   if (target_label)
1333     {
1334       /* If this is the test of a loop, it is very likely true.  We scan
1335          backwards from the target label.  If we find a NOTE_INSN_LOOP_BEG
1336          before the next real insn, we assume the branch is to the top of
1337          the loop.  */
1338       for (insn = PREV_INSN (target_label);
1339            insn && GET_CODE (insn) == NOTE;
1340            insn = PREV_INSN (insn))
1341         if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
1342           return 2;
1343
1344       /* If this is a jump to the test of a loop, it is likely true.  We scan
1345          forwards from the target label.  If we find a NOTE_INSN_LOOP_VTOP
1346          before the next real insn, we assume the branch is to the loop branch
1347          test.  */
1348       for (insn = NEXT_INSN (target_label);
1349            insn && GET_CODE (insn) == NOTE;
1350            insn = PREV_INSN (insn))
1351         if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_VTOP)
1352           return 1;
1353     }
1354
1355   /* Look at the relative rarities of the fallthough and destination.  If
1356      they differ, we can predict the branch that way. */
1357
1358   switch (rare_fallthrough - rare_dest)
1359     {
1360     case -2:
1361       return -1;
1362     case -1:
1363       return 0;
1364     case 0:
1365       break;
1366     case 1:
1367       return 1;
1368     case 2:
1369       return 2;
1370     }
1371
1372   /* If we couldn't figure out what this jump was, assume it won't be
1373      taken.  This should be rare.  */
1374   if (condition == 0)
1375     return 0;
1376
1377   /* EQ tests are usually false and NE tests are usually true.  Also,
1378      most quantities are positive, so we can make the appropriate guesses
1379      about signed comparisons against zero.  */
1380   switch (GET_CODE (condition))
1381     {
1382     case CONST_INT:
1383       /* Unconditional branch.  */
1384       return 1;
1385     case EQ:
1386       return 0;
1387     case NE:
1388       return 1;
1389     case LE:
1390     case LT:
1391       if (XEXP (condition, 1) == const0_rtx)
1392         return 0;
1393       break;
1394     case GE:
1395     case GT:
1396       if (XEXP (condition, 1) == const0_rtx)
1397         return 1;
1398       break;
1399     }
1400
1401   /* Predict backward branches usually take, forward branches usually not.  If
1402      we don't know whether this is forward or backward, assume the branch
1403      will be taken, since most are.  */
1404   return (target_label == 0 || INSN_UID (jump_insn) > max_uid
1405           || INSN_UID (target_label) > max_uid
1406           || (uid_to_ruid[INSN_UID (jump_insn)]
1407               > uid_to_ruid[INSN_UID (target_label)]));;
1408 }
1409
1410 /* Return the condition under which INSN will branch to TARGET.  If TARGET
1411    is zero, return the condition under which INSN will return.  If INSN is
1412    an unconditional branch, return const_true_rtx.  If INSN isn't a simple
1413    type of jump, or it doesn't go to TARGET, return 0.  */
1414
1415 static rtx
1416 get_branch_condition (insn, target)
1417      rtx insn;
1418      rtx target;
1419 {
1420   rtx pat = PATTERN (insn);
1421   rtx src;
1422
1423   if (condjump_in_parallel_p (insn))
1424     pat = XVECEXP (pat, 0, 0);
1425
1426   if (GET_CODE (pat) == RETURN)
1427     return target == 0 ? const_true_rtx : 0;
1428
1429   else if (GET_CODE (pat) != SET || SET_DEST (pat) != pc_rtx)
1430     return 0;
1431
1432   src = SET_SRC (pat);
1433   if (GET_CODE (src) == LABEL_REF && XEXP (src, 0) == target)
1434     return const_true_rtx;
1435
1436   else if (GET_CODE (src) == IF_THEN_ELSE
1437            && ((target == 0 && GET_CODE (XEXP (src, 1)) == RETURN)
1438                || (GET_CODE (XEXP (src, 1)) == LABEL_REF
1439                    && XEXP (XEXP (src, 1), 0) == target))
1440            && XEXP (src, 2) == pc_rtx)
1441     return XEXP (src, 0);
1442
1443   else if (GET_CODE (src) == IF_THEN_ELSE
1444            && ((target == 0 && GET_CODE (XEXP (src, 2)) == RETURN)
1445                || (GET_CODE (XEXP (src, 2)) == LABEL_REF
1446                    && XEXP (XEXP (src, 2), 0) == target))
1447            && XEXP (src, 1) == pc_rtx)
1448     return gen_rtx (reverse_condition (GET_CODE (XEXP (src, 0))),
1449                     GET_MODE (XEXP (src, 0)),
1450                     XEXP (XEXP (src, 0), 0), XEXP (XEXP (src, 0), 1));
1451
1452   return 0;
1453 }
1454
1455 /* Return non-zero if CONDITION is more strict than the condition of
1456    INSN, i.e., if INSN will always branch if CONDITION is true.  */
1457
1458 static int
1459 condition_dominates_p (condition, insn)
1460      rtx condition;
1461      rtx insn;
1462 {
1463   rtx other_condition = get_branch_condition (insn, JUMP_LABEL (insn));
1464   enum rtx_code code = GET_CODE (condition);
1465   enum rtx_code other_code;
1466
1467   if (rtx_equal_p (condition, other_condition)
1468       || other_condition == const_true_rtx)
1469     return 1;
1470
1471   else if (condition == const_true_rtx || other_condition == 0)
1472     return 0;
1473
1474   other_code = GET_CODE (other_condition);
1475   if (GET_RTX_LENGTH (code) != 2 || GET_RTX_LENGTH (other_code) != 2
1476       || ! rtx_equal_p (XEXP (condition, 0), XEXP (other_condition, 0))
1477       || ! rtx_equal_p (XEXP (condition, 1), XEXP (other_condition, 1)))
1478     return 0;
1479
1480   return comparison_dominates_p (code, other_code);
1481 }
1482
1483 /* Return non-zero if redirecting JUMP to NEWLABEL does not invalidate
1484    any insns already in the delay slot of JUMP.  */
1485
1486 static int
1487 redirect_with_delay_slots_safe_p (jump, newlabel, seq)
1488      rtx jump, newlabel, seq;
1489 {
1490   int flags, slots, i;
1491   rtx pat = PATTERN (seq);
1492
1493   /* Make sure all the delay slots of this jump would still
1494      be valid after threading the jump.  If they are still
1495      valid, then return non-zero.  */
1496
1497   flags = get_jump_flags (jump, newlabel);
1498   for (i = 1; i < XVECLEN (pat, 0); i++)
1499     if (! (
1500 #ifdef ANNUL_IFFALSE_SLOTS
1501            (INSN_ANNULLED_BRANCH_P (jump)
1502             && INSN_FROM_TARGET_P (XVECEXP (pat, 0, i)))
1503            ? eligible_for_annul_false (jump, i - 1,
1504                                        XVECEXP (pat, 0, i), flags) :
1505 #endif
1506 #ifdef ANNUL_IFTRUE_SLOTS
1507            (INSN_ANNULLED_BRANCH_P (jump)
1508             && ! INSN_FROM_TARGET_P (XVECEXP (pat, 0, i)))
1509            ? eligible_for_annul_true (jump, i - 1,
1510                                       XVECEXP (pat, 0, i), flags) :
1511 #endif
1512            eligible_for_delay (jump, i -1, XVECEXP (pat, 0, i), flags)))
1513       break;
1514
1515   return (i == XVECLEN (pat, 0));
1516 }
1517
1518 /* Return non-zero if redirecting JUMP to NEWLABEL does not invalidate
1519    any insns we wish to place in the delay slot of JUMP.  */
1520
1521 static int
1522 redirect_with_delay_list_safe_p (jump, newlabel, delay_list)
1523      rtx jump, newlabel, delay_list;
1524 {
1525   int flags, i;
1526   rtx li;
1527
1528   /* Make sure all the insns in DELAY_LIST would still be
1529      valid after threading the jump.  If they are still
1530      valid, then return non-zero.  */
1531
1532   flags = get_jump_flags (jump, newlabel);
1533   for (li = delay_list, i = 0; li; li = XEXP (li, 1), i++)
1534     if (! (
1535 #ifdef ANNUL_IFFALSE_SLOTS
1536            (INSN_ANNULLED_BRANCH_P (jump)
1537             && INSN_FROM_TARGET_P (XEXP (li, 0)))
1538            ? eligible_for_annul_false (jump, i, XEXP (li, 0), flags) :
1539 #endif
1540 #ifdef ANNUL_IFTRUE_SLOTS
1541            (INSN_ANNULLED_BRANCH_P (jump)
1542             && ! INSN_FROM_TARGET_P (XEXP (li, 0)))
1543            ? eligible_for_annul_true (jump, i, XEXP (li, 0), flags) :
1544 #endif
1545            eligible_for_delay (jump, i, XEXP (li, 0), flags)))
1546       break;
1547
1548   return (li == NULL);
1549 }
1550
1551 \f
1552 /* INSN branches to an insn whose pattern SEQ is a SEQUENCE.  Given that
1553    the condition tested by INSN is CONDITION and the resources shown in
1554    OTHER_NEEDED are needed after INSN, see whether INSN can take all the insns
1555    from SEQ's delay list, in addition to whatever insns it may execute
1556    (in DELAY_LIST).   SETS and NEEDED are denote resources already set and
1557    needed while searching for delay slot insns.  Return the concatenated
1558    delay list if possible, otherwise, return 0.
1559
1560    SLOTS_TO_FILL is the total number of slots required by INSN, and
1561    PSLOTS_FILLED points to the number filled so far (also the number of
1562    insns in DELAY_LIST).  It is updated with the number that have been
1563    filled from the SEQUENCE, if any.
1564
1565    PANNUL_P points to a non-zero value if we already know that we need
1566    to annul INSN.  If this routine determines that annulling is needed,
1567    it may set that value non-zero.
1568
1569    PNEW_THREAD points to a location that is to receive the place at which
1570    execution should continue.  */
1571
1572 static rtx
1573 steal_delay_list_from_target (insn, condition, seq, delay_list,
1574                               sets, needed, other_needed,
1575                               slots_to_fill, pslots_filled, pannul_p,
1576                               pnew_thread)
1577      rtx insn, condition;
1578      rtx seq;
1579      rtx delay_list;
1580      struct resources *sets, *needed, *other_needed;
1581      int slots_to_fill;
1582      int *pslots_filled;
1583      int *pannul_p;
1584      rtx *pnew_thread;
1585 {
1586   rtx temp;
1587   int slots_remaining = slots_to_fill - *pslots_filled;
1588   int total_slots_filled = *pslots_filled;
1589   rtx new_delay_list = 0;
1590   int must_annul = *pannul_p;
1591   int i;
1592
1593   /* We can't do anything if there are more delay slots in SEQ than we
1594      can handle, or if we don't know that it will be a taken branch.
1595      We know that it will be a taken branch if it is either an unconditional
1596      branch or a conditional branch with a stricter branch condition.
1597
1598      Also, exit if the branch has more than one set, since then it is computing
1599      other results that can't be ignored, e.g. the HPPA mov&branch instruction.
1600      ??? It may be possible to move other sets into INSN in addition to
1601      moving the instructions in the delay slots.  */
1602
1603   if (XVECLEN (seq, 0) - 1 > slots_remaining
1604       || ! condition_dominates_p (condition, XVECEXP (seq, 0, 0))
1605       || ! single_set (XVECEXP (seq, 0, 0)))
1606     return delay_list;
1607
1608   for (i = 1; i < XVECLEN (seq, 0); i++)
1609     {
1610       rtx trial = XVECEXP (seq, 0, i);
1611       int flags;
1612
1613       if (insn_references_resource_p (trial, sets, 0)
1614           || insn_sets_resource_p (trial, needed, 0)
1615           || insn_sets_resource_p (trial, sets, 0)
1616 #ifdef HAVE_cc0
1617           /* If TRIAL sets CC0, we can't copy it, so we can't steal this
1618              delay list.  */
1619           || find_reg_note (trial, REG_CC_USER, NULL_RTX)
1620 #endif
1621           /* If TRIAL is from the fallthrough code of an annulled branch insn
1622              in SEQ, we cannot use it.  */
1623           || (INSN_ANNULLED_BRANCH_P (XVECEXP (seq, 0, 0))
1624               && ! INSN_FROM_TARGET_P (trial)))
1625         return delay_list;
1626
1627       /* If this insn was already done (usually in a previous delay slot),
1628          pretend we put it in our delay slot.  */
1629       if (redundant_insn (trial, insn, new_delay_list))
1630         continue;
1631
1632       /* We will end up re-vectoring this branch, so compute flags
1633          based on jumping to the new label.  */
1634       flags = get_jump_flags (insn, JUMP_LABEL (XVECEXP (seq, 0, 0)));
1635
1636       if (! must_annul
1637           && ((condition == const_true_rtx
1638                || (! insn_sets_resource_p (trial, other_needed, 0)
1639                    && ! may_trap_p (PATTERN (trial)))))
1640           ? eligible_for_delay (insn, total_slots_filled, trial, flags)
1641           : (must_annul = 1,
1642              eligible_for_annul_false (insn, total_slots_filled, trial, flags)))
1643         {
1644           temp = copy_rtx (trial);
1645           INSN_FROM_TARGET_P (temp) = 1;
1646           new_delay_list = add_to_delay_list (temp, new_delay_list);
1647           total_slots_filled++;
1648
1649           if (--slots_remaining == 0)
1650             break;
1651         }
1652       else
1653         return delay_list;
1654     }
1655
1656   /* Show the place to which we will be branching.  */
1657   *pnew_thread = next_active_insn (JUMP_LABEL (XVECEXP (seq, 0, 0)));
1658
1659   /* Add any new insns to the delay list and update the count of the
1660      number of slots filled.  */
1661   *pslots_filled = total_slots_filled;
1662   *pannul_p = must_annul;
1663
1664   if (delay_list == 0)
1665     return new_delay_list;
1666
1667   for (temp = new_delay_list; temp; temp = XEXP (temp, 1))
1668     delay_list = add_to_delay_list (XEXP (temp, 0), delay_list);
1669
1670   return delay_list;
1671 }
1672 \f
1673 /* Similar to steal_delay_list_from_target except that SEQ is on the
1674    fallthrough path of INSN.  Here we only do something if the delay insn
1675    of SEQ is an unconditional branch.  In that case we steal its delay slot
1676    for INSN since unconditional branches are much easier to fill.  */
1677
1678 static rtx
1679 steal_delay_list_from_fallthrough (insn, condition, seq,
1680                                    delay_list, sets, needed, other_needed,
1681                                    slots_to_fill, pslots_filled, pannul_p)
1682      rtx insn, condition;
1683      rtx seq;
1684      rtx delay_list;
1685      struct resources *sets, *needed, *other_needed;
1686      int slots_to_fill;
1687      int *pslots_filled;
1688      int *pannul_p;
1689 {
1690   int i;
1691   int flags;
1692
1693   flags = get_jump_flags (insn, JUMP_LABEL (insn));
1694
1695   /* We can't do anything if SEQ's delay insn isn't an
1696      unconditional branch.  */
1697
1698   if (! simplejump_p (XVECEXP (seq, 0, 0))
1699       && GET_CODE (PATTERN (XVECEXP (seq, 0, 0))) != RETURN)
1700     return delay_list;
1701
1702   for (i = 1; i < XVECLEN (seq, 0); i++)
1703     {
1704       rtx trial = XVECEXP (seq, 0, i);
1705
1706       /* If TRIAL sets CC0, stealing it will move it too far from the use
1707          of CC0.  */
1708       if (insn_references_resource_p (trial, sets, 0)
1709           || insn_sets_resource_p (trial, needed, 0)
1710           || insn_sets_resource_p (trial, sets, 0)
1711 #ifdef HAVE_cc0
1712           || sets_cc0_p (PATTERN (trial))
1713 #endif
1714           )
1715
1716         break;
1717
1718       /* If this insn was already done, we don't need it.  */
1719       if (redundant_insn (trial, insn, delay_list))
1720         {
1721           delete_from_delay_slot (trial);
1722           continue;
1723         }
1724
1725       if (! *pannul_p
1726           && ((condition == const_true_rtx
1727                || (! insn_sets_resource_p (trial, other_needed, 0)
1728                    && ! may_trap_p (PATTERN (trial)))))
1729           ? eligible_for_delay (insn, *pslots_filled, trial, flags)
1730           : (*pannul_p = 1,
1731              eligible_for_annul_true (insn, *pslots_filled, trial, flags)))
1732         {
1733           delete_from_delay_slot (trial);
1734           delay_list = add_to_delay_list (trial, delay_list);
1735
1736           if (++(*pslots_filled) == slots_to_fill)
1737             break;
1738         }
1739       else
1740         break;
1741     }
1742
1743   return delay_list;
1744 }
1745 \f
1746 /* Try merging insns starting at THREAD which match exactly the insns in
1747    INSN's delay list.
1748
1749    If all insns were matched and the insn was previously annulling, the
1750    annul bit will be cleared.
1751
1752    For each insn that is merged, if the branch is or will be non-annulling,
1753    we delete the merged insn.  */
1754
1755 static void
1756 try_merge_delay_insns (insn, thread)
1757      rtx insn, thread;
1758 {
1759   rtx trial, next_trial;
1760   rtx delay_insn = XVECEXP (PATTERN (insn), 0, 0);
1761   int annul_p = INSN_ANNULLED_BRANCH_P (delay_insn);
1762   int slot_number = 1;
1763   int num_slots = XVECLEN (PATTERN (insn), 0);
1764   rtx next_to_match = XVECEXP (PATTERN (insn), 0, slot_number);
1765   struct resources set, needed;
1766   rtx merged_insns = 0;
1767   int i;
1768   int flags;
1769
1770   flags = get_jump_flags (delay_insn, JUMP_LABEL (delay_insn));
1771
1772   CLEAR_RESOURCE (&needed);
1773   CLEAR_RESOURCE (&set);
1774
1775   /* If this is not an annulling branch, take into account anything needed in
1776      NEXT_TO_MATCH.  This prevents two increments from being incorrectly
1777      folded into one.  If we are annulling, this would be the correct
1778      thing to do.  (The alternative, looking at things set in NEXT_TO_MATCH
1779      will essentially disable this optimization.  This method is somewhat of
1780      a kludge, but I don't see a better way.)  */
1781   if (! annul_p)
1782     mark_referenced_resources (next_to_match, &needed, 1);
1783
1784   for (trial = thread; !stop_search_p (trial, 1); trial = next_trial)
1785     {
1786       rtx pat = PATTERN (trial);
1787       rtx oldtrial = trial;
1788
1789       next_trial = next_nonnote_insn (trial);
1790
1791       /* TRIAL must be a CALL_INSN or INSN.  Skip USE and CLOBBER.  */
1792       if (GET_CODE (trial) == INSN
1793           && (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER))
1794         continue;
1795
1796       if (GET_CODE (next_to_match) == GET_CODE (trial)
1797 #ifdef HAVE_cc0
1798           /* We can't share an insn that sets cc0.  */
1799           && ! sets_cc0_p (pat)
1800 #endif
1801           && ! insn_references_resource_p (trial, &set, 1)
1802           && ! insn_sets_resource_p (trial, &set, 1)
1803           && ! insn_sets_resource_p (trial, &needed, 1)
1804           && (trial = try_split (pat, trial, 0)) != 0
1805           /* Update next_trial, in case try_split succeeded.  */
1806           && (next_trial = next_nonnote_insn (trial))
1807           /* Likewise THREAD.  */
1808           && (thread = oldtrial == thread ? trial : thread)
1809           && rtx_equal_p (PATTERN (next_to_match), PATTERN (trial))
1810           /* Have to test this condition if annul condition is different
1811              from (and less restrictive than) non-annulling one.  */
1812           && eligible_for_delay (delay_insn, slot_number - 1, trial, flags))
1813         {
1814
1815           if (! annul_p)
1816             {
1817               update_block (trial, thread);
1818               if (trial == thread)
1819                 thread = next_active_insn (thread);
1820
1821               delete_insn (trial);
1822               INSN_FROM_TARGET_P (next_to_match) = 0;
1823             }
1824           else
1825             merged_insns = gen_rtx (INSN_LIST, VOIDmode, trial, merged_insns);
1826
1827           if (++slot_number == num_slots)
1828             break;
1829
1830           next_to_match = XVECEXP (PATTERN (insn), 0, slot_number);
1831           if (! annul_p)
1832             mark_referenced_resources (next_to_match, &needed, 1);
1833         }
1834
1835       mark_set_resources (trial, &set, 0, 1);
1836       mark_referenced_resources (trial, &needed, 1);
1837     }
1838
1839   /* See if we stopped on a filled insn.  If we did, try to see if its
1840      delay slots match.  */
1841   if (slot_number != num_slots
1842       && trial && GET_CODE (trial) == INSN
1843       && GET_CODE (PATTERN (trial)) == SEQUENCE
1844       && ! INSN_ANNULLED_BRANCH_P (XVECEXP (PATTERN (trial), 0, 0)))
1845     {
1846       rtx pat = PATTERN (trial);
1847       rtx filled_insn = XVECEXP (pat, 0, 0);
1848
1849       /* Account for resources set/needed by the filled insn.  */
1850       mark_set_resources (filled_insn, &set, 0, 1);
1851       mark_referenced_resources (filled_insn, &needed, 1);
1852
1853       for (i = 1; i < XVECLEN (pat, 0); i++)
1854         {
1855           rtx dtrial = XVECEXP (pat, 0, i);
1856
1857           if (! insn_references_resource_p (dtrial, &set, 1)
1858               && ! insn_sets_resource_p (dtrial, &set, 1)
1859               && ! insn_sets_resource_p (dtrial, &needed, 1)
1860 #ifdef HAVE_cc0
1861               && ! sets_cc0_p (PATTERN (dtrial))
1862 #endif
1863               && rtx_equal_p (PATTERN (next_to_match), PATTERN (dtrial))
1864               && eligible_for_delay (delay_insn, slot_number - 1, dtrial, flags))
1865             {
1866               if (! annul_p)
1867                 {
1868                   update_block (dtrial, thread);
1869                   delete_from_delay_slot (dtrial);
1870                   INSN_FROM_TARGET_P (next_to_match) = 0;
1871                 }
1872               else
1873                 merged_insns = gen_rtx (INSN_LIST, SImode, dtrial,
1874                                         merged_insns);
1875
1876               if (++slot_number == num_slots)
1877                 break;
1878
1879               next_to_match = XVECEXP (PATTERN (insn), 0, slot_number);
1880             }
1881         }
1882     }
1883
1884   /* If all insns in the delay slot have been matched and we were previously
1885      annulling the branch, we need not any more.  In that case delete all the
1886      merged insns.  Also clear the INSN_FROM_TARGET_P bit of each insn the
1887      the delay list so that we know that it isn't only being used at the
1888      target.  */
1889   if (slot_number == num_slots && annul_p)
1890     {
1891       for (; merged_insns; merged_insns = XEXP (merged_insns, 1))
1892         {
1893           if (GET_MODE (merged_insns) == SImode)
1894             {
1895               update_block (XEXP (merged_insns, 0), thread);
1896               delete_from_delay_slot (XEXP (merged_insns, 0));
1897             }
1898           else
1899             {
1900               update_block (XEXP (merged_insns, 0), thread);
1901               delete_insn (XEXP (merged_insns, 0));
1902             }
1903         }
1904
1905       INSN_ANNULLED_BRANCH_P (delay_insn) = 0;
1906
1907       for (i = 0; i < XVECLEN (PATTERN (insn), 0); i++)
1908         INSN_FROM_TARGET_P (XVECEXP (PATTERN (insn), 0, i)) = 0;
1909     }
1910 }
1911 \f
1912 /* See if INSN is redundant with an insn in front of TARGET.  Often this
1913    is called when INSN is a candidate for a delay slot of TARGET.
1914    DELAY_LIST are insns that will be placed in delay slots of TARGET in front
1915    of INSN.  Often INSN will be redundant with an insn in a delay slot of
1916    some previous insn.  This happens when we have a series of branches to the
1917    same label; in that case the first insn at the target might want to go
1918    into each of the delay slots.
1919
1920    If we are not careful, this routine can take up a significant fraction
1921    of the total compilation time (4%), but only wins rarely.  Hence we
1922    speed this routine up by making two passes.  The first pass goes back
1923    until it hits a label and sees if it find an insn with an identical
1924    pattern.  Only in this (relatively rare) event does it check for
1925    data conflicts.
1926
1927    We do not split insns we encounter.  This could cause us not to find a
1928    redundant insn, but the cost of splitting seems greater than the possible
1929    gain in rare cases.  */
1930
1931 static rtx
1932 redundant_insn (insn, target, delay_list)
1933      rtx insn;
1934      rtx target;
1935      rtx delay_list;
1936 {
1937   rtx target_main = target;
1938   rtx ipat = PATTERN (insn);
1939   rtx trial, pat;
1940   struct resources needed, set;
1941   int i;
1942
1943   /* Scan backwards looking for a match.  */
1944   for (trial = PREV_INSN (target); trial; trial = PREV_INSN (trial))
1945     {
1946       if (GET_CODE (trial) == CODE_LABEL)
1947         return 0;
1948
1949       if (GET_RTX_CLASS (GET_CODE (trial)) != 'i')
1950         continue;
1951
1952       pat = PATTERN (trial);
1953       if (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER)
1954         continue;
1955
1956       if (GET_CODE (pat) == SEQUENCE)
1957         {
1958           /* Stop for a CALL and its delay slots because it is difficult to
1959              track its resource needs correctly.  */
1960           if (GET_CODE (XVECEXP (pat, 0, 0)) == CALL_INSN)
1961             return 0;
1962
1963           /* Stop for an INSN or JUMP_INSN with delayed effects and its delay
1964              slots because it is difficult to track its resource needs
1965              correctly.  */
1966
1967 #ifdef INSN_SETS_ARE_DELAYED
1968           if (INSN_SETS_ARE_DELAYED (XVECEXP (pat, 0, 0)))
1969             return 0;
1970 #endif
1971
1972 #ifdef INSN_REFERENCES_ARE_DELAYED
1973           if (INSN_REFERENCES_ARE_DELAYED (XVECEXP (pat, 0, 0)))
1974             return 0;
1975 #endif
1976
1977           /* See if any of the insns in the delay slot match, updating
1978              resource requirements as we go.  */
1979           for (i = XVECLEN (pat, 0) - 1; i > 0; i--)
1980             if (GET_CODE (XVECEXP (pat, 0, i)) == GET_CODE (insn)
1981                 && rtx_equal_p (PATTERN (XVECEXP (pat, 0, i)), ipat))
1982               break;
1983
1984           /* If found a match, exit this loop early.  */
1985           if (i > 0)
1986             break;
1987         }
1988
1989       else if (GET_CODE (trial) == GET_CODE (insn) && rtx_equal_p (pat, ipat))
1990         break;
1991     }
1992
1993   /* If we didn't find an insn that matches, return 0.  */
1994   if (trial == 0)
1995     return 0;
1996
1997   /* See what resources this insn sets and needs.  If they overlap, or
1998      if this insn references CC0, it can't be redundant.  */
1999
2000   CLEAR_RESOURCE (&needed);
2001   CLEAR_RESOURCE (&set);
2002   mark_set_resources (insn, &set, 0, 1);
2003   mark_referenced_resources (insn, &needed, 1);
2004
2005   /* If TARGET is a SEQUENCE, get the main insn.  */
2006   if (GET_CODE (target) == INSN && GET_CODE (PATTERN (target)) == SEQUENCE)
2007     target_main = XVECEXP (PATTERN (target), 0, 0);
2008
2009   if (resource_conflicts_p (&needed, &set)
2010 #ifdef HAVE_cc0
2011       || reg_mentioned_p (cc0_rtx, ipat)
2012 #endif
2013       /* The insn requiring the delay may not set anything needed or set by
2014          INSN.  */
2015       || insn_sets_resource_p (target_main, &needed, 1)
2016       || insn_sets_resource_p (target_main, &set, 1))
2017     return 0;
2018
2019   /* Insns we pass may not set either NEEDED or SET, so merge them for
2020      simpler tests.  */
2021   needed.memory |= set.memory;
2022   IOR_HARD_REG_SET (needed.regs, set.regs);
2023
2024   /* This insn isn't redundant if it conflicts with an insn that either is
2025      or will be in a delay slot of TARGET.  */
2026
2027   while (delay_list)
2028     {
2029       if (insn_sets_resource_p (XEXP (delay_list, 0), &needed, 1))
2030         return 0;
2031       delay_list = XEXP (delay_list, 1);
2032     }
2033
2034   if (GET_CODE (target) == INSN && GET_CODE (PATTERN (target)) == SEQUENCE)
2035     for (i = 1; i < XVECLEN (PATTERN (target), 0); i++)
2036       if (insn_sets_resource_p (XVECEXP (PATTERN (target), 0, i), &needed, 1))
2037         return 0;
2038
2039   /* Scan backwards until we reach a label or an insn that uses something
2040      INSN sets or sets something insn uses or sets.  */
2041
2042   for (trial = PREV_INSN (target);
2043        trial && GET_CODE (trial) != CODE_LABEL;
2044        trial = PREV_INSN (trial))
2045     {
2046       if (GET_CODE (trial) != INSN && GET_CODE (trial) != CALL_INSN
2047           && GET_CODE (trial) != JUMP_INSN)
2048         continue;
2049
2050       pat = PATTERN (trial);
2051       if (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER)
2052         continue;
2053
2054       if (GET_CODE (pat) == SEQUENCE)
2055         {
2056           /* If this is a CALL_INSN and its delay slots, it is hard to track
2057              the resource needs properly, so give up.  */
2058           if (GET_CODE (XVECEXP (pat, 0, 0)) == CALL_INSN)
2059             return 0;
2060
2061           /* If this this is an INSN or JUMP_INSN with delayed effects, it
2062              is hard to track the resource needs properly, so give up.  */
2063
2064 #ifdef INSN_SETS_ARE_DELAYED
2065           if (INSN_SETS_ARE_DELAYED (XVECEXP (pat, 0, 0)))
2066             return 0;
2067 #endif
2068
2069 #ifdef INSN_REFERENCES_ARE_DELAYED
2070           if (INSN_REFERENCES_ARE_DELAYED (XVECEXP (pat, 0, 0)))
2071             return 0;
2072 #endif
2073
2074           /* See if any of the insns in the delay slot match, updating
2075              resource requirements as we go.  */
2076           for (i = XVECLEN (pat, 0) - 1; i > 0; i--)
2077             {
2078               rtx candidate = XVECEXP (pat, 0, i);
2079
2080               /* If an insn will be annulled if the branch is false, it isn't
2081                  considered as a possible duplicate insn.  */
2082               if (rtx_equal_p (PATTERN (candidate), ipat)
2083                   && ! (INSN_ANNULLED_BRANCH_P (XVECEXP (pat, 0, 0))
2084                         && INSN_FROM_TARGET_P (candidate)))
2085                 {
2086                   /* Show that this insn will be used in the sequel.  */
2087                   INSN_FROM_TARGET_P (candidate) = 0;
2088                   return candidate;
2089                 }
2090
2091               /* Unless this is an annulled insn from the target of a branch,
2092                  we must stop if it sets anything needed or set by INSN.  */
2093               if ((! INSN_ANNULLED_BRANCH_P (XVECEXP (pat, 0, 0))
2094                    || ! INSN_FROM_TARGET_P (candidate))
2095                   && insn_sets_resource_p (candidate, &needed, 1))
2096                 return 0;
2097             }
2098
2099
2100           /* If the insn requiring the delay slot conflicts with INSN, we
2101              must stop.  */
2102           if (insn_sets_resource_p (XVECEXP (pat, 0, 0), &needed, 1))
2103             return 0;
2104         }
2105       else
2106         {
2107           /* See if TRIAL is the same as INSN.  */
2108           pat = PATTERN (trial);
2109           if (rtx_equal_p (pat, ipat))
2110             return trial;
2111
2112           /* Can't go any further if TRIAL conflicts with INSN.  */
2113           if (insn_sets_resource_p (trial, &needed, 1))
2114             return 0;
2115         }
2116     }
2117
2118   return 0;
2119 }
2120 \f
2121 /* Return 1 if THREAD can only be executed in one way.  If LABEL is non-zero,
2122    it is the target of the branch insn being scanned.  If ALLOW_FALLTHROUGH
2123    is non-zero, we are allowed to fall into this thread; otherwise, we are
2124    not.
2125
2126    If LABEL is used more than one or we pass a label other than LABEL before
2127    finding an active insn, we do not own this thread.  */
2128
2129 static int
2130 own_thread_p (thread, label, allow_fallthrough)
2131      rtx thread;
2132      rtx label;
2133      int allow_fallthrough;
2134 {
2135   rtx active_insn;
2136   rtx insn;
2137
2138   /* We don't own the function end.  */
2139   if (thread == 0)
2140     return 0;
2141
2142   /* Get the first active insn, or THREAD, if it is an active insn.  */
2143   active_insn = next_active_insn (PREV_INSN (thread));
2144
2145   for (insn = thread; insn != active_insn; insn = NEXT_INSN (insn))
2146     if (GET_CODE (insn) == CODE_LABEL
2147         && (insn != label || LABEL_NUSES (insn) != 1))
2148       return 0;
2149
2150   if (allow_fallthrough)
2151     return 1;
2152
2153   /* Ensure that we reach a BARRIER before any insn or label.  */
2154   for (insn = prev_nonnote_insn (thread);
2155        insn == 0 || GET_CODE (insn) != BARRIER;
2156        insn = prev_nonnote_insn (insn))
2157     if (insn == 0
2158         || GET_CODE (insn) == CODE_LABEL
2159         || (GET_CODE (insn) == INSN
2160             && GET_CODE (PATTERN (insn)) != USE
2161             && GET_CODE (PATTERN (insn)) != CLOBBER))
2162       return 0;
2163
2164   return 1;
2165 }
2166 \f
2167 /* Find the number of the basic block that starts closest to INSN.  Return -1
2168    if we couldn't find such a basic block.  */
2169
2170 static int
2171 find_basic_block (insn)
2172      rtx insn;
2173 {
2174   int i;
2175
2176   /* Scan backwards to the previous BARRIER.  Then see if we can find a
2177      label that starts a basic block.  Return the basic block number.  */
2178
2179   for (insn = prev_nonnote_insn (insn);
2180        insn && GET_CODE (insn) != BARRIER;
2181        insn = prev_nonnote_insn (insn))
2182     ;
2183
2184   /* The start of the function is basic block zero.  */
2185   if (insn == 0)
2186     return 0;
2187
2188   /* See if any of the upcoming CODE_LABELs start a basic block.  If we reach
2189      anything other than a CODE_LABEL or note, we can't find this code.  */
2190   for (insn = next_nonnote_insn (insn);
2191        insn && GET_CODE (insn) == CODE_LABEL;
2192        insn = next_nonnote_insn (insn))
2193     {
2194       for (i = 0; i < n_basic_blocks; i++)
2195         if (insn == basic_block_head[i])
2196           return i;
2197     }
2198
2199   return -1;
2200 }
2201 \f
2202 /* Called when INSN is being moved from a location near the target of a jump.
2203    We leave a marker of the form (use (INSN)) immediately in front
2204    of WHERE for mark_target_live_regs.  These markers will be deleted when
2205    reorg finishes.
2206
2207    We used to try to update the live status of registers if WHERE is at
2208    the start of a basic block, but that can't work since we may remove a
2209    BARRIER in relax_delay_slots.  */
2210
2211 static void
2212 update_block (insn, where)
2213      rtx insn;
2214      rtx where;
2215 {
2216   int b;
2217
2218   /* Ignore if this was in a delay slot and it came from the target of
2219      a branch.  */
2220   if (INSN_FROM_TARGET_P (insn))
2221     return;
2222
2223   emit_insn_before (gen_rtx (USE, VOIDmode, insn), where);
2224
2225   /* INSN might be making a value live in a block where it didn't use to
2226      be.  So recompute liveness information for this block.  */
2227
2228   b = find_basic_block (insn);
2229   if (b != -1)
2230     bb_ticks[b]++;
2231 }
2232
2233 /* Similar to REDIRECT_JUMP except that we update the BB_TICKS entry for
2234    the basic block containing the jump.  */
2235
2236 static int
2237 reorg_redirect_jump (jump, nlabel)
2238      rtx jump;
2239      rtx nlabel;
2240 {
2241   int b = find_basic_block (jump);
2242
2243   if (b != -1)
2244     bb_ticks[b]++;
2245
2246   return redirect_jump (jump, nlabel);
2247 }
2248
2249 /* Called when INSN is being moved forward into a delay slot of DELAYED_INSN.
2250    We check every instruction between INSN and DELAYED_INSN for REG_DEAD notes
2251    that reference values used in INSN.  If we find one, then we move the
2252    REG_DEAD note to INSN.
2253
2254    This is needed to handle the case where an later insn (after INSN) has a
2255    REG_DEAD note for a register used by INSN, and this later insn subsequently
2256    gets moved before a CODE_LABEL because it is a redundant insn.  In this
2257    case, mark_target_live_regs may be confused into thinking the register
2258    is dead because it sees a REG_DEAD note immediately before a CODE_LABEL.  */
2259
2260 static void
2261 update_reg_dead_notes (insn, delayed_insn)
2262      rtx insn, delayed_insn;
2263 {
2264   rtx p, link, next;
2265
2266   for (p = next_nonnote_insn (insn); p != delayed_insn;
2267        p = next_nonnote_insn (p))
2268     for (link = REG_NOTES (p); link; link = next)
2269       {
2270         next = XEXP (link, 1);
2271
2272         if (REG_NOTE_KIND (link) != REG_DEAD
2273             || GET_CODE (XEXP (link, 0)) != REG)
2274           continue;
2275
2276         if (reg_referenced_p (XEXP (link, 0), PATTERN (insn)))
2277           {
2278             /* Move the REG_DEAD note from P to INSN.  */
2279             remove_note (p, link);
2280             XEXP (link, 1) = REG_NOTES (insn);
2281             REG_NOTES (insn) = link;
2282           }
2283       }
2284 }
2285
2286 /* Delete any REG_UNUSED notes that exist on INSN but not on REDUNDANT_INSN.
2287
2288    This handles the case of udivmodXi4 instructions which optimize their
2289    output depending on whether any REG_UNUSED notes are present.
2290    we must make sure that INSN calculates as many results as REDUNDANT_INSN
2291    does.  */
2292
2293 static void
2294 update_reg_unused_notes (insn, redundant_insn)
2295      rtx insn, redundant_insn;
2296 {
2297   rtx p, link, next;
2298
2299   for (link = REG_NOTES (insn); link; link = next)
2300     {
2301       next = XEXP (link, 1);
2302
2303       if (REG_NOTE_KIND (link) != REG_UNUSED
2304           || GET_CODE (XEXP (link, 0)) != REG)
2305         continue;
2306
2307       if (! find_regno_note (redundant_insn, REG_UNUSED,
2308                              REGNO (XEXP (link, 0))))
2309         remove_note (insn, link);
2310     }
2311 }
2312 \f
2313 /* Marks registers possibly live at the current place being scanned by
2314    mark_target_live_regs.  Used only by next two function.    */
2315
2316 static HARD_REG_SET current_live_regs;
2317
2318 /* Marks registers for which we have seen a REG_DEAD note but no assignment.
2319    Also only used by the next two functions.  */
2320
2321 static HARD_REG_SET pending_dead_regs;
2322
2323 /* Utility function called from mark_target_live_regs via note_stores.
2324    It deadens any CLOBBERed registers and livens any SET registers.  */
2325
2326 static void
2327 update_live_status (dest, x)
2328      rtx dest;
2329      rtx x;
2330 {
2331   int first_regno, last_regno;
2332   int i;
2333
2334   if (GET_CODE (dest) != REG
2335       && (GET_CODE (dest) != SUBREG || GET_CODE (SUBREG_REG (dest)) != REG))
2336     return;
2337
2338   if (GET_CODE (dest) == SUBREG)
2339     first_regno = REGNO (SUBREG_REG (dest)) + SUBREG_WORD (dest);
2340   else
2341     first_regno = REGNO (dest);
2342
2343   last_regno = first_regno + HARD_REGNO_NREGS (first_regno, GET_MODE (dest));
2344
2345   if (GET_CODE (x) == CLOBBER)
2346     for (i = first_regno; i < last_regno; i++)
2347       CLEAR_HARD_REG_BIT (current_live_regs, i);
2348   else
2349     for (i = first_regno; i < last_regno; i++)
2350       {
2351         SET_HARD_REG_BIT (current_live_regs, i);
2352         CLEAR_HARD_REG_BIT (pending_dead_regs, i);
2353       }
2354 }
2355
2356 /* Similar to next_insn, but ignores insns in the delay slots of
2357    an annulled branch.  */
2358
2359 static rtx
2360 next_insn_no_annul (insn)
2361      rtx insn;
2362 {
2363   if (insn)
2364     {
2365       /* If INSN is an annulled branch, skip any insns from the target
2366          of the branch.  */
2367       if (INSN_ANNULLED_BRANCH_P (insn)
2368           && NEXT_INSN (PREV_INSN (insn)) != insn)
2369         while (INSN_FROM_TARGET_P (NEXT_INSN (insn)))
2370           insn = NEXT_INSN (insn);
2371
2372       insn = NEXT_INSN (insn);
2373       if (insn && GET_CODE (insn) == INSN
2374           && GET_CODE (PATTERN (insn)) == SEQUENCE)
2375         insn = XVECEXP (PATTERN (insn), 0, 0);
2376     }
2377
2378   return insn;
2379 }
2380 \f
2381 /* Set the resources that are live at TARGET.
2382
2383    If TARGET is zero, we refer to the end of the current function and can
2384    return our precomputed value.
2385
2386    Otherwise, we try to find out what is live by consulting the basic block
2387    information.  This is tricky, because we must consider the actions of
2388    reload and jump optimization, which occur after the basic block information
2389    has been computed.
2390
2391    Accordingly, we proceed as follows::
2392
2393    We find the previous BARRIER and look at all immediately following labels
2394    (with no intervening active insns) to see if any of them start a basic
2395    block.  If we hit the start of the function first, we use block 0.
2396
2397    Once we have found a basic block and a corresponding first insns, we can
2398    accurately compute the live status from basic_block_live_regs and
2399    reg_renumber.  (By starting at a label following a BARRIER, we are immune
2400    to actions taken by reload and jump.)  Then we scan all insns between
2401    that point and our target.  For each CLOBBER (or for call-clobbered regs
2402    when we pass a CALL_INSN), mark the appropriate registers are dead.  For
2403    a SET, mark them as live.
2404
2405    We have to be careful when using REG_DEAD notes because they are not
2406    updated by such things as find_equiv_reg.  So keep track of registers
2407    marked as dead that haven't been assigned to, and mark them dead at the
2408    next CODE_LABEL since reload and jump won't propagate values across labels.
2409
2410    If we cannot find the start of a basic block (should be a very rare
2411    case, if it can happen at all), mark everything as potentially live.
2412
2413    Next, scan forward from TARGET looking for things set or clobbered
2414    before they are used.  These are not live.
2415
2416    Because we can be called many times on the same target, save our results
2417    in a hash table indexed by INSN_UID.  */
2418
2419 static void
2420 mark_target_live_regs (target, res)
2421      rtx target;
2422      struct resources *res;
2423 {
2424   int b = -1;
2425   int i;
2426   struct target_info *tinfo;
2427   rtx insn, next;
2428   rtx jump_insn = 0;
2429   rtx jump_target;
2430   HARD_REG_SET scratch;
2431   struct resources set, needed;
2432   int jump_count = 0;
2433
2434   /* Handle end of function.  */
2435   if (target == 0)
2436     {
2437       *res = end_of_function_needs;
2438       return;
2439     }
2440
2441   /* We have to assume memory is needed, but the CC isn't.  */
2442   res->memory = 1;
2443   res->volatil = 0;
2444   res->cc = 0;
2445
2446   /* See if we have computed this value already.  */
2447   for (tinfo = target_hash_table[INSN_UID (target) % TARGET_HASH_PRIME];
2448        tinfo; tinfo = tinfo->next)
2449     if (tinfo->uid == INSN_UID (target))
2450       break;
2451
2452   /* Start by getting the basic block number.  If we have saved information,
2453      we can get it from there unless the insn at the start of the basic block
2454      has been deleted.  */
2455   if (tinfo && tinfo->block != -1
2456       && ! INSN_DELETED_P (basic_block_head[tinfo->block]))
2457     b = tinfo->block;
2458
2459   if (b == -1)
2460     b = find_basic_block (target);
2461
2462   if (tinfo)
2463     {
2464       /* If the information is up-to-date, use it.  Otherwise, we will
2465          update it below.  */
2466       if (b == tinfo->block && b != -1 && tinfo->bb_tick == bb_ticks[b])
2467         {
2468           COPY_HARD_REG_SET (res->regs, tinfo->live_regs);
2469           return;
2470         }
2471     }
2472   else
2473     {
2474       /* Allocate a place to put our results and chain it into the
2475          hash table.  */
2476       tinfo = (struct target_info *) oballoc (sizeof (struct target_info));
2477       tinfo->uid = INSN_UID (target);
2478       tinfo->block = b;
2479       tinfo->next = target_hash_table[INSN_UID (target) % TARGET_HASH_PRIME];
2480       target_hash_table[INSN_UID (target) % TARGET_HASH_PRIME] = tinfo;
2481     }
2482
2483   CLEAR_HARD_REG_SET (pending_dead_regs);
2484
2485   /* If we found a basic block, get the live registers from it and update
2486      them with anything set or killed between its start and the insn before
2487      TARGET.  Otherwise, we must assume everything is live.  */
2488   if (b != -1)
2489     {
2490       regset regs_live = basic_block_live_at_start[b];
2491       int offset, j;
2492       REGSET_ELT_TYPE bit;
2493       int regno;
2494       rtx start_insn, stop_insn;
2495
2496       /* Compute hard regs live at start of block -- this is the real hard regs
2497          marked live, plus live pseudo regs that have been renumbered to
2498          hard regs.  */
2499
2500 #ifdef HARD_REG_SET
2501       current_live_regs = *regs_live;
2502 #else
2503       COPY_HARD_REG_SET (current_live_regs, regs_live);
2504 #endif
2505
2506       for (offset = 0, i = 0; offset < regset_size; offset++)
2507         {
2508           if (regs_live[offset] == 0)
2509             i += REGSET_ELT_BITS;
2510           else
2511             for (bit = 1; bit && i < max_regno; bit <<= 1, i++)
2512               if ((regs_live[offset] & bit)
2513                   && (regno = reg_renumber[i]) >= 0)
2514                 for (j = regno;
2515                      j < regno + HARD_REGNO_NREGS (regno,
2516                                                    PSEUDO_REGNO_MODE (i));
2517                      j++)
2518                   SET_HARD_REG_BIT (current_live_regs, j);
2519         }
2520
2521       /* Get starting and ending insn, handling the case where each might
2522          be a SEQUENCE.  */
2523       start_insn = (b == 0 ? get_insns () : basic_block_head[b]);
2524       stop_insn = target;
2525
2526       if (GET_CODE (start_insn) == INSN
2527           && GET_CODE (PATTERN (start_insn)) == SEQUENCE)
2528         start_insn = XVECEXP (PATTERN (start_insn), 0, 0);
2529
2530       if (GET_CODE (stop_insn) == INSN
2531           && GET_CODE (PATTERN (stop_insn)) == SEQUENCE)
2532         stop_insn = next_insn (PREV_INSN (stop_insn));
2533
2534       for (insn = start_insn; insn != stop_insn;
2535            insn = next_insn_no_annul (insn))
2536         {
2537           rtx link;
2538           rtx real_insn = insn;
2539
2540           /* If this insn is from the target of a branch, it isn't going to
2541              be used in the sequel.  If it is used in both cases, this
2542              test will not be true.  */
2543           if (INSN_FROM_TARGET_P (insn))
2544             continue;
2545
2546           /* If this insn is a USE made by update_block, we care about the
2547              underlying insn.  */
2548           if (GET_CODE (insn) == INSN && GET_CODE (PATTERN (insn)) == USE
2549               && GET_RTX_CLASS (GET_CODE (XEXP (PATTERN (insn), 0))) == 'i')
2550               real_insn = XEXP (PATTERN (insn), 0);
2551
2552           if (GET_CODE (real_insn) == CALL_INSN)
2553             {
2554               /* CALL clobbers all call-used regs that aren't fixed except
2555                  sp, ap, and fp.  Do this before setting the result of the
2556                  call live.  */
2557               for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
2558                 if (call_used_regs[i]
2559                     && i != STACK_POINTER_REGNUM && i != FRAME_POINTER_REGNUM
2560                     && i != ARG_POINTER_REGNUM
2561 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
2562                     && i != HARD_FRAME_POINTER_REGNUM
2563 #endif
2564 #if ARG_POINTER_REGNUM != FRAME_POINTER_REGNUM
2565                     && ! (i == ARG_POINTER_REGNUM && fixed_regs[i])
2566 #endif
2567 #ifdef PIC_OFFSET_TABLE_REGNUM
2568                     && ! (i == PIC_OFFSET_TABLE_REGNUM && flag_pic)
2569 #endif
2570                     )
2571                   CLEAR_HARD_REG_BIT (current_live_regs, i);
2572
2573               /* A CALL_INSN sets any global register live, since it may
2574                  have been modified by the call.  */
2575               for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
2576                 if (global_regs[i])
2577                   SET_HARD_REG_BIT (current_live_regs, i);
2578             }
2579
2580           /* Mark anything killed in an insn to be deadened at the next
2581              label.  Ignore USE insns; the only REG_DEAD notes will be for
2582              parameters.  But they might be early.  A CALL_INSN will usually
2583              clobber registers used for parameters.  It isn't worth bothering
2584              with the unlikely case when it won't.  */
2585           if ((GET_CODE (real_insn) == INSN
2586                && GET_CODE (PATTERN (real_insn)) != USE
2587                && GET_CODE (PATTERN (real_insn)) != CLOBBER)
2588               || GET_CODE (real_insn) == JUMP_INSN
2589               || GET_CODE (real_insn) == CALL_INSN)
2590             {
2591               for (link = REG_NOTES (real_insn); link; link = XEXP (link, 1))
2592                 if (REG_NOTE_KIND (link) == REG_DEAD
2593                     && GET_CODE (XEXP (link, 0)) == REG
2594                     && REGNO (XEXP (link, 0)) < FIRST_PSEUDO_REGISTER)
2595                   {
2596                     int first_regno = REGNO (XEXP (link, 0));
2597                     int last_regno
2598                       = (first_regno
2599                          + HARD_REGNO_NREGS (first_regno,
2600                                              GET_MODE (XEXP (link, 0))));
2601
2602                     for (i = first_regno; i < last_regno; i++)
2603                       SET_HARD_REG_BIT (pending_dead_regs, i);
2604                   }
2605
2606               note_stores (PATTERN (real_insn), update_live_status);
2607
2608               /* If any registers were unused after this insn, kill them.
2609                  These notes will always be accurate.  */
2610               for (link = REG_NOTES (real_insn); link; link = XEXP (link, 1))
2611                 if (REG_NOTE_KIND (link) == REG_UNUSED
2612                     && GET_CODE (XEXP (link, 0)) == REG
2613                     && REGNO (XEXP (link, 0)) < FIRST_PSEUDO_REGISTER)
2614                   {
2615                     int first_regno = REGNO (XEXP (link, 0));
2616                     int last_regno
2617                       = (first_regno
2618                          + HARD_REGNO_NREGS (first_regno,
2619                                              GET_MODE (XEXP (link, 0))));
2620
2621                     for (i = first_regno; i < last_regno; i++)
2622                       CLEAR_HARD_REG_BIT (current_live_regs, i);
2623                   }
2624             }
2625
2626           else if (GET_CODE (real_insn) == CODE_LABEL)
2627             {
2628               /* A label clobbers the pending dead registers since neither
2629                  reload nor jump will propagate a value across a label.  */
2630               AND_COMPL_HARD_REG_SET (current_live_regs, pending_dead_regs);
2631               CLEAR_HARD_REG_SET (pending_dead_regs);
2632             }
2633
2634           /* The beginning of the epilogue corresponds to the end of the
2635              RTL chain when there are no epilogue insns.  Certain resources
2636              are implicitly required at that point.  */
2637           else if (GET_CODE (real_insn) == NOTE
2638                    && NOTE_LINE_NUMBER (real_insn) == NOTE_INSN_EPILOGUE_BEG)
2639             IOR_HARD_REG_SET (current_live_regs, start_of_epilogue_needs.regs);
2640         }
2641
2642       COPY_HARD_REG_SET (res->regs, current_live_regs);
2643       tinfo->block = b;
2644       tinfo->bb_tick = bb_ticks[b];
2645     }
2646   else
2647     /* We didn't find the start of a basic block.  Assume everything
2648        in use.  This should happen only extremely rarely.  */
2649     SET_HARD_REG_SET (res->regs);
2650
2651   /* Now step forward from TARGET looking for registers that are set before
2652      they are used.  These are dead.  If we pass a label, any pending dead
2653      registers that weren't yet used can be made dead.  Stop when we pass a
2654      conditional JUMP_INSN; follow the first few unconditional branches.  */
2655
2656   CLEAR_RESOURCE (&set);
2657   CLEAR_RESOURCE (&needed);
2658
2659   for (insn = target; insn; insn = next)
2660     {
2661       rtx this_jump_insn = insn;
2662
2663       next = NEXT_INSN (insn);
2664       switch (GET_CODE (insn))
2665         {
2666         case CODE_LABEL:
2667           AND_COMPL_HARD_REG_SET (pending_dead_regs, needed.regs);
2668           AND_COMPL_HARD_REG_SET (res->regs, pending_dead_regs);
2669           CLEAR_HARD_REG_SET (pending_dead_regs);
2670           continue;
2671
2672         case BARRIER:
2673         case NOTE:
2674           continue;
2675
2676         case INSN:
2677           if (GET_CODE (PATTERN (insn)) == USE)
2678             {
2679               /* If INSN is a USE made by update_block, we care about the
2680                  underlying insn.  Any registers set by the underlying insn
2681                  are live since the insn is being done somewhere else.  */
2682               if (GET_RTX_CLASS (GET_CODE (XEXP (PATTERN (insn), 0))) == 'i')
2683                 mark_set_resources (XEXP (PATTERN (insn), 0), res, 0, 1);
2684
2685               /* All other USE insns are to be ignored.  */
2686               continue;
2687             }
2688           else if (GET_CODE (PATTERN (insn)) == CLOBBER)
2689             continue;
2690           else if (GET_CODE (PATTERN (insn)) == SEQUENCE)
2691             {
2692               /* An unconditional jump can be used to fill the delay slot
2693                  of a call, so search for a JUMP_INSN in any position.  */
2694               for (i = 0; i < XVECLEN (PATTERN (insn), 0); i++)
2695                 {
2696                   this_jump_insn = XVECEXP (PATTERN (insn), 0, i);
2697                   if (GET_CODE (this_jump_insn) == JUMP_INSN)
2698                     break;
2699                 }
2700             }
2701         }
2702
2703       if (GET_CODE (this_jump_insn) == JUMP_INSN)
2704         {
2705           if (jump_count++ < 10
2706               && (simplejump_p (this_jump_insn)
2707                   || GET_CODE (PATTERN (this_jump_insn)) == RETURN))
2708             {
2709               next = next_active_insn (JUMP_LABEL (this_jump_insn));
2710               if (jump_insn == 0)
2711                 {
2712                   jump_insn = insn;
2713                   jump_target = JUMP_LABEL (this_jump_insn);
2714                 }
2715             }
2716           else
2717             break;
2718         }
2719
2720       mark_referenced_resources (insn, &needed, 1);
2721       mark_set_resources (insn, &set, 0, 1);
2722
2723       COPY_HARD_REG_SET (scratch, set.regs);
2724       AND_COMPL_HARD_REG_SET (scratch, needed.regs);
2725       AND_COMPL_HARD_REG_SET (res->regs, scratch);
2726     }
2727
2728   /* If we hit an unconditional branch, we have another way of finding out
2729      what is live: we can see what is live at the branch target and include
2730      anything used but not set before the branch.  The only things that are
2731      live are those that are live using the above test and the test below.
2732
2733      Don't try this if we expired our jump count above, since that would
2734      mean there may be an infinite loop in the function being compiled.  */
2735
2736   if (jump_insn && jump_count < 10)
2737     {
2738       struct resources new_resources;
2739       rtx stop_insn = next_active_insn (jump_insn);
2740
2741       mark_target_live_regs (next_active_insn (jump_target), &new_resources);
2742       CLEAR_RESOURCE (&set);
2743       CLEAR_RESOURCE (&needed);
2744
2745       /* Include JUMP_INSN in the needed registers.  */
2746       for (insn = target; insn != stop_insn; insn = next_active_insn (insn))
2747         {
2748           mark_referenced_resources (insn, &needed, 1);
2749
2750           COPY_HARD_REG_SET (scratch, needed.regs);
2751           AND_COMPL_HARD_REG_SET (scratch, set.regs);
2752           IOR_HARD_REG_SET (new_resources.regs, scratch);
2753
2754           mark_set_resources (insn, &set, 0, 1);
2755         }
2756
2757       AND_HARD_REG_SET (res->regs, new_resources.regs);
2758     }
2759
2760   COPY_HARD_REG_SET (tinfo->live_regs, res->regs);
2761 }
2762 \f
2763 /* Scan a function looking for insns that need a delay slot and find insns to
2764    put into the delay slot.
2765
2766    NON_JUMPS_P is non-zero if we are to only try to fill non-jump insns (such
2767    as calls).  We do these first since we don't want jump insns (that are
2768    easier to fill) to get the only insns that could be used for non-jump insns.
2769    When it is zero, only try to fill JUMP_INSNs.
2770
2771    When slots are filled in this manner, the insns (including the
2772    delay_insn) are put together in a SEQUENCE rtx.  In this fashion,
2773    it is possible to tell whether a delay slot has really been filled
2774    or not.  `final' knows how to deal with this, by communicating
2775    through FINAL_SEQUENCE.  */
2776
2777 static void
2778 fill_simple_delay_slots (first, non_jumps_p)
2779      rtx first;
2780      int non_jumps_p;
2781 {
2782   register rtx insn, pat, trial, next_trial;
2783   register int i, j;
2784   int num_unfilled_slots = unfilled_slots_next - unfilled_slots_base;
2785   struct resources needed, set;
2786   register int slots_to_fill, slots_filled;
2787   rtx delay_list;
2788
2789   for (i = 0; i < num_unfilled_slots; i++)
2790     {
2791       int flags;
2792       /* Get the next insn to fill.  If it has already had any slots assigned,
2793          we can't do anything with it.  Maybe we'll improve this later.  */
2794
2795       insn = unfilled_slots_base[i];
2796       if (insn == 0
2797           || INSN_DELETED_P (insn)
2798           || (GET_CODE (insn) == INSN
2799               && GET_CODE (PATTERN (insn)) == SEQUENCE)
2800           || (GET_CODE (insn) == JUMP_INSN && non_jumps_p)
2801           || (GET_CODE (insn) != JUMP_INSN && ! non_jumps_p))
2802         continue;
2803
2804       if (GET_CODE (insn) == JUMP_INSN)
2805         flags = get_jump_flags (insn, JUMP_LABEL (insn));
2806       else
2807         flags = get_jump_flags (insn, NULL_RTX);
2808       slots_to_fill = num_delay_slots (insn);
2809       if (slots_to_fill == 0)
2810         abort ();
2811
2812       /* This insn needs, or can use, some delay slots.  SLOTS_TO_FILL
2813          says how many.  After initialization, first try optimizing
2814
2815          call _foo              call _foo
2816          nop                    add %o7,.-L1,%o7
2817          b,a L1
2818          nop
2819
2820          If this case applies, the delay slot of the call is filled with
2821          the unconditional jump.  This is done first to avoid having the
2822          delay slot of the call filled in the backward scan.  Also, since
2823          the unconditional jump is likely to also have a delay slot, that
2824          insn must exist when it is subsequently scanned.
2825
2826          This is tried on each insn with delay slots as some machines
2827          have insns which perform calls, but are not represented as
2828          CALL_INSNs.  */
2829
2830       slots_filled = 0;
2831       delay_list = 0;
2832
2833       if ((trial = next_active_insn (insn))
2834           && GET_CODE (trial) == JUMP_INSN
2835           && simplejump_p (trial)
2836           && eligible_for_delay (insn, slots_filled, trial, flags)
2837           && no_labels_between_p (insn, trial))
2838         {
2839           slots_filled++;
2840           delay_list = add_to_delay_list (trial, delay_list);
2841           /* Remove the unconditional jump from consideration for delay slot
2842              filling and unthread it.  */
2843           if (unfilled_slots_base[i + 1] == trial)
2844             unfilled_slots_base[i + 1] = 0;
2845           {
2846             rtx next = NEXT_INSN (trial);
2847             rtx prev = PREV_INSN (trial);
2848             if (prev)
2849               NEXT_INSN (prev) = next;
2850             if (next)
2851               PREV_INSN (next) = prev;
2852           }
2853         }
2854
2855       /* Now, scan backwards from the insn to search for a potential
2856          delay-slot candidate.  Stop searching when a label or jump is hit.
2857
2858          For each candidate, if it is to go into the delay slot (moved
2859          forward in execution sequence), it must not need or set any resources
2860          that were set by later insns and must not set any resources that
2861          are needed for those insns.
2862
2863          The delay slot insn itself sets resources unless it is a call
2864          (in which case the called routine, not the insn itself, is doing
2865          the setting).  */
2866
2867       if (slots_filled < slots_to_fill)
2868         {
2869           CLEAR_RESOURCE (&needed);
2870           CLEAR_RESOURCE (&set);
2871           mark_set_resources (insn, &set, 0, 0);
2872           mark_referenced_resources (insn, &needed, 0);
2873
2874           for (trial = prev_nonnote_insn (insn); ! stop_search_p (trial, 1);
2875                trial = next_trial)
2876             {
2877               next_trial = prev_nonnote_insn (trial);
2878
2879               /* This must be an INSN or CALL_INSN.  */
2880               pat = PATTERN (trial);
2881
2882               /* USE and CLOBBER at this level was just for flow; ignore it.  */
2883               if (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER)
2884                 continue;
2885
2886               /* Check for resource conflict first, to avoid unnecessary
2887                  splitting.  */
2888               if (! insn_references_resource_p (trial, &set, 1)
2889                   && ! insn_sets_resource_p (trial, &set, 1)
2890                   && ! insn_sets_resource_p (trial, &needed, 1)
2891 #ifdef HAVE_cc0
2892                   /* Can't separate set of cc0 from its use.  */
2893                   && ! (reg_mentioned_p (cc0_rtx, pat)
2894                         && ! sets_cc0_p (cc0_rtx, pat))
2895 #endif
2896                   )
2897                 {
2898                   trial = try_split (pat, trial, 1);
2899                   next_trial = prev_nonnote_insn (trial);
2900                   if (eligible_for_delay (insn, slots_filled, trial, flags))
2901                     {
2902                       /* In this case, we are searching backward, so if we
2903                          find insns to put on the delay list, we want
2904                          to put them at the head, rather than the
2905                          tail, of the list.  */
2906
2907                       update_reg_dead_notes (trial, insn);
2908                       delay_list = gen_rtx (INSN_LIST, VOIDmode,
2909                                             trial, delay_list);
2910                       update_block (trial, trial);
2911                       delete_insn (trial);
2912                       if (slots_to_fill == ++slots_filled)
2913                         break;
2914                       continue;
2915                     }
2916                 }
2917
2918               mark_set_resources (trial, &set, 0, 1);
2919               mark_referenced_resources (trial, &needed, 1);
2920             }
2921         }
2922
2923       /* If all needed slots haven't been filled, we come here.  */
2924
2925       /* Try to optimize case of jumping around a single insn.  */
2926 #if defined(ANNUL_IFFALSE_SLOTS) || defined(ANNUL_IFTRUE_SLOTS)
2927       if (slots_filled != slots_to_fill
2928           && delay_list == 0
2929           && GET_CODE (insn) == JUMP_INSN
2930           && (condjump_p (insn) || condjump_in_parallel_p (insn)))
2931         {
2932           delay_list = optimize_skip (insn);
2933           if (delay_list)
2934             slots_filled += 1;
2935         }
2936 #endif
2937
2938       /* Try to get insns from beyond the insn needing the delay slot.
2939          These insns can neither set or reference resources set in insns being
2940          skipped, cannot set resources in the insn being skipped, and, if this
2941          is a CALL_INSN (or a CALL_INSN is passed), cannot trap (because the
2942          call might not return).
2943
2944          If this is a conditional jump, see if it merges back to us early
2945          enough for us to pick up insns from the merge point.  Don't do
2946          this if there is another branch to our label unless we pass all of
2947          them.
2948
2949          Another similar merge is if we jump to the same place that a
2950          later unconditional jump branches to.  In that case, we don't
2951          care about the number of uses of our label.  */
2952
2953       if (slots_filled != slots_to_fill
2954           && (GET_CODE (insn) != JUMP_INSN
2955               || ((condjump_p (insn) || condjump_in_parallel_p (insn))
2956                    && ! simplejump_p (insn)
2957                    && JUMP_LABEL (insn) != 0)))
2958         {
2959           rtx target = 0;
2960           int maybe_never = 0;
2961           int passed_label = 0;
2962           int target_uses;
2963           struct resources needed_at_jump;
2964
2965           CLEAR_RESOURCE (&needed);
2966           CLEAR_RESOURCE (&set);
2967
2968           if (GET_CODE (insn) == CALL_INSN)
2969             {
2970               mark_set_resources (insn, &set, 0, 1);
2971               mark_referenced_resources (insn, &needed, 1);
2972               maybe_never = 1;
2973             }
2974           else
2975             {
2976               mark_set_resources (insn, &set, 0, 1);
2977               mark_referenced_resources (insn, &needed, 1);
2978               if (GET_CODE (insn) == JUMP_INSN)
2979                 {
2980                   /* Get our target and show how many more uses we want to
2981                      see before we hit the label.  */
2982                   target = JUMP_LABEL (insn);
2983                   target_uses = LABEL_NUSES (target) - 1;
2984                 }
2985
2986             }
2987
2988           for (trial = next_nonnote_insn (insn); trial; trial = next_trial)
2989             {
2990               rtx pat, trial_delay;
2991
2992               next_trial = next_nonnote_insn (trial);
2993
2994               if (GET_CODE (trial) == CODE_LABEL)
2995                 {
2996                   passed_label = 1;
2997
2998                   /* If this is our target, see if we have seen all its uses.
2999                      If so, indicate we have passed our target and ignore it.
3000                      All other labels cause us to stop our search.  */
3001                   if (trial == target && target_uses == 0)
3002                     {
3003                       target = 0;
3004                       continue;
3005                     }
3006                   else
3007                     break;
3008                 }
3009               else if (GET_CODE (trial) == BARRIER)
3010                 break;
3011
3012               /* We must have an INSN, JUMP_INSN, or CALL_INSN.  */
3013               pat = PATTERN (trial);
3014
3015               /* Stand-alone USE and CLOBBER are just for flow.  */
3016               if (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER)
3017                 continue;
3018
3019               /* If this already has filled delay slots, get the insn needing
3020                  the delay slots.  */
3021               if (GET_CODE (pat) == SEQUENCE)
3022                 trial_delay = XVECEXP (pat, 0, 0);
3023               else
3024                 trial_delay = trial;
3025
3026               /* If this is a jump insn to our target, indicate that we have
3027                  seen another jump to it.  If we aren't handling a conditional
3028                  jump, stop our search. Otherwise, compute the needs at its
3029                  target and add them to NEEDED.  */
3030               if (GET_CODE (trial_delay) == JUMP_INSN)
3031                 {
3032                   if (target == 0)
3033                     break;
3034                   else if (JUMP_LABEL (trial_delay) == target)
3035                     target_uses--;
3036                   else
3037                     {
3038                       mark_target_live_regs
3039                         (next_active_insn (JUMP_LABEL (trial_delay)),
3040                          &needed_at_jump);
3041                       needed.memory |= needed_at_jump.memory;
3042                       IOR_HARD_REG_SET (needed.regs, needed_at_jump.regs);
3043                     }
3044                 }
3045
3046               /* See if we have a resource problem before we try to
3047                  split.   */
3048               if (target == 0
3049                   && GET_CODE (pat) != SEQUENCE
3050                   && ! insn_references_resource_p (trial, &set, 1)
3051                   && ! insn_sets_resource_p (trial, &set, 1)
3052                   && ! insn_sets_resource_p (trial, &needed, 1)
3053 #ifdef HAVE_cc0
3054                   && ! (reg_mentioned_p (cc0_rtx, pat) && ! sets_cc0_p (pat))
3055 #endif
3056                   && ! (maybe_never && may_trap_p (pat))
3057                   && (trial = try_split (pat, trial, 0))
3058                   && eligible_for_delay (insn, slots_filled, trial, flags))
3059                 {
3060                   next_trial = next_nonnote_insn (trial);
3061                   delay_list = add_to_delay_list (trial, delay_list);
3062
3063 #ifdef HAVE_cc0
3064                   if (reg_mentioned_p (cc0_rtx, pat))
3065                     link_cc0_insns (trial);
3066 #endif
3067
3068                   if (passed_label)
3069                     update_block (trial, trial);
3070                   delete_insn (trial);
3071                   if (slots_to_fill == ++slots_filled)
3072                     break;
3073                   continue;
3074                 }
3075
3076               mark_set_resources (trial, &set, 0, 1);
3077               mark_referenced_resources (trial, &needed, 1);
3078
3079               /* Ensure we don't put insns between the setting of cc and the
3080                  comparison by moving a setting of cc into an earlier delay
3081                  slot since these insns could clobber the condition code.  */
3082               set.cc = 1;
3083
3084               /* If this is a call or jump, we might not get here.  */
3085               if (GET_CODE (trial) == CALL_INSN
3086                   || GET_CODE (trial) == JUMP_INSN)
3087                 maybe_never = 1;
3088             }
3089
3090           /* If there are slots left to fill and our search was stopped by an
3091              unconditional branch, try the insn at the branch target.  We can
3092              redirect the branch if it works.  */
3093           if (slots_to_fill != slots_filled
3094               && trial
3095               && GET_CODE (trial) == JUMP_INSN
3096               && simplejump_p (trial)
3097               && (target == 0 || JUMP_LABEL (trial) == target)
3098               && (next_trial = next_active_insn (JUMP_LABEL (trial))) != 0
3099               && ! (GET_CODE (next_trial) == INSN
3100                     && GET_CODE (PATTERN (next_trial)) == SEQUENCE)
3101               && ! insn_references_resource_p (next_trial, &set, 1)
3102               && ! insn_sets_resource_p (next_trial, &set, 1)
3103               && ! insn_sets_resource_p (next_trial, &needed, 1)
3104 #ifdef HAVE_cc0
3105               && ! reg_mentioned_p (cc0_rtx, PATTERN (next_trial))
3106 #endif
3107               && ! (maybe_never && may_trap_p (PATTERN (next_trial)))
3108               && (next_trial = try_split (PATTERN (next_trial), next_trial, 0))
3109               && eligible_for_delay (insn, slots_filled, next_trial, flags))
3110             {
3111               rtx new_label = next_active_insn (next_trial);
3112
3113               if (new_label != 0)
3114                 new_label = get_label_before (new_label);
3115               else
3116                 new_label = find_end_label ();
3117
3118               delay_list
3119                 = add_to_delay_list (copy_rtx (next_trial), delay_list);
3120               slots_filled++;
3121               reorg_redirect_jump (trial, new_label);
3122
3123               /* If we merged because we both jumped to the same place,
3124                  redirect the original insn also.  */
3125               if (target)
3126                 reorg_redirect_jump (insn, new_label);
3127             }
3128         }
3129
3130       if (delay_list)
3131         unfilled_slots_base[i]
3132           = emit_delay_sequence (insn, delay_list,
3133                                  slots_filled, slots_to_fill);
3134
3135       if (slots_to_fill == slots_filled)
3136         unfilled_slots_base[i] = 0;
3137
3138       note_delay_statistics (slots_filled, 0);
3139     }
3140
3141 #ifdef DELAY_SLOTS_FOR_EPILOGUE
3142   /* See if the epilogue needs any delay slots.  Try to fill them if so.
3143      The only thing we can do is scan backwards from the end of the
3144      function.  If we did this in a previous pass, it is incorrect to do it
3145      again.  */
3146   if (current_function_epilogue_delay_list)
3147     return;
3148
3149   slots_to_fill = DELAY_SLOTS_FOR_EPILOGUE;
3150   if (slots_to_fill == 0)
3151     return;
3152
3153   slots_filled = 0;
3154   CLEAR_RESOURCE (&set);
3155
3156   /* The frame pointer and stack pointer are needed at the beginning of
3157      the epilogue, so instructions setting them can not be put in the
3158      epilogue delay slot.  However, everything else needed at function
3159      end is safe, so we don't want to use end_of_function_needs here.  */
3160   CLEAR_RESOURCE (&needed);
3161   if (frame_pointer_needed)
3162     {
3163       SET_HARD_REG_BIT (needed.regs, FRAME_POINTER_REGNUM);
3164 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
3165       SET_HARD_REG_BIT (needed.regs, HARD_FRAME_POINTER_REGNUM);
3166 #endif
3167 #ifdef EXIT_IGNORE_STACK
3168       if (! EXIT_IGNORE_STACK)
3169 #endif
3170         SET_HARD_REG_BIT (needed.regs, STACK_POINTER_REGNUM);
3171     }
3172   else
3173     SET_HARD_REG_BIT (needed.regs, STACK_POINTER_REGNUM);
3174
3175   for (trial = get_last_insn (); ! stop_search_p (trial, 1);
3176        trial = PREV_INSN (trial))
3177     {
3178       if (GET_CODE (trial) == NOTE)
3179         continue;
3180       pat = PATTERN (trial);
3181       if (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER)
3182         continue;
3183
3184       if (! insn_references_resource_p (trial, &set, 1)
3185           && ! insn_sets_resource_p (trial, &needed, 1)
3186           && ! insn_sets_resource_p (trial, &set, 1)
3187 #ifdef HAVE_cc0
3188           /* Don't want to mess with cc0 here.  */
3189           && ! reg_mentioned_p (cc0_rtx, pat)
3190 #endif
3191           )
3192         {
3193           trial = try_split (pat, trial, 1);
3194           if (ELIGIBLE_FOR_EPILOGUE_DELAY (trial, slots_filled))
3195             {
3196               /* Here as well we are searching backward, so put the
3197                  insns we find on the head of the list.  */
3198
3199               current_function_epilogue_delay_list
3200                 = gen_rtx (INSN_LIST, VOIDmode, trial,
3201                            current_function_epilogue_delay_list);
3202               mark_referenced_resources (trial, &end_of_function_needs, 1);
3203               update_block (trial, trial);
3204               delete_insn (trial);
3205
3206               /* Clear deleted bit so final.c will output the insn.  */
3207               INSN_DELETED_P (trial) = 0;
3208
3209               if (slots_to_fill == ++slots_filled)
3210                 break;
3211               continue;
3212             }
3213         }
3214
3215       mark_set_resources (trial, &set, 0, 1);
3216       mark_referenced_resources (trial, &needed, 1);
3217     }
3218
3219   note_delay_statistics (slots_filled, 0);
3220 #endif
3221 }
3222 \f
3223 /* Try to find insns to place in delay slots.
3224
3225    INSN is the jump needing SLOTS_TO_FILL delay slots.  It tests CONDITION
3226    or is an unconditional branch if CONDITION is const_true_rtx.
3227    *PSLOTS_FILLED is updated with the number of slots that we have filled.
3228
3229    THREAD is a flow-of-control, either the insns to be executed if the
3230    branch is true or if the branch is false, THREAD_IF_TRUE says which.
3231
3232    OPPOSITE_THREAD is the thread in the opposite direction.  It is used
3233    to see if any potential delay slot insns set things needed there.
3234
3235    LIKELY is non-zero if it is extremely likely that the branch will be
3236    taken and THREAD_IF_TRUE is set.  This is used for the branch at the
3237    end of a loop back up to the top.
3238
3239    OWN_THREAD and OWN_OPPOSITE_THREAD are true if we are the only user of the
3240    thread.  I.e., it is the fallthrough code of our jump or the target of the
3241    jump when we are the only jump going there.
3242
3243    If OWN_THREAD is false, it must be the "true" thread of a jump.  In that
3244    case, we can only take insns from the head of the thread for our delay
3245    slot.  We then adjust the jump to point after the insns we have taken.  */
3246
3247 static rtx
3248 fill_slots_from_thread (insn, condition, thread, opposite_thread, likely,
3249                         thread_if_true, own_thread, own_opposite_thread,
3250                         slots_to_fill, pslots_filled)
3251      rtx insn;
3252      rtx condition;
3253      rtx thread, opposite_thread;
3254      int likely;
3255      int thread_if_true;
3256      int own_thread, own_opposite_thread;
3257      int slots_to_fill, *pslots_filled;
3258 {
3259   rtx new_thread;
3260   rtx delay_list = 0;
3261   struct resources opposite_needed, set, needed;
3262   rtx trial;
3263   int lose = 0;
3264   int must_annul = 0;
3265   int flags;
3266
3267   /* Validate our arguments.  */
3268   if ((condition == const_true_rtx && ! thread_if_true)
3269       || (! own_thread && ! thread_if_true))
3270     abort ();
3271
3272   flags = get_jump_flags (insn, JUMP_LABEL (insn));
3273
3274   /* If our thread is the end of subroutine, we can't get any delay
3275      insns from that.  */
3276   if (thread == 0)
3277     return 0;
3278
3279   /* If this is an unconditional branch, nothing is needed at the
3280      opposite thread.  Otherwise, compute what is needed there.  */
3281   if (condition == const_true_rtx)
3282     CLEAR_RESOURCE (&opposite_needed);
3283   else
3284     mark_target_live_regs (opposite_thread, &opposite_needed);
3285
3286   /* If the insn at THREAD can be split, do it here to avoid having to
3287      update THREAD and NEW_THREAD if it is done in the loop below.  Also
3288      initialize NEW_THREAD.  */
3289
3290   new_thread = thread = try_split (PATTERN (thread), thread, 0);
3291
3292   /* Scan insns at THREAD.  We are looking for an insn that can be removed
3293      from THREAD (it neither sets nor references resources that were set
3294      ahead of it and it doesn't set anything needs by the insns ahead of
3295      it) and that either can be placed in an annulling insn or aren't
3296      needed at OPPOSITE_THREAD.  */
3297
3298   CLEAR_RESOURCE (&needed);
3299   CLEAR_RESOURCE (&set);
3300
3301   /* If we do not own this thread, we must stop as soon as we find
3302      something that we can't put in a delay slot, since all we can do
3303      is branch into THREAD at a later point.  Therefore, labels stop
3304      the search if this is not the `true' thread.  */
3305
3306   for (trial = thread;
3307        ! stop_search_p (trial, ! thread_if_true) && (! lose || own_thread);
3308        trial = next_nonnote_insn (trial))
3309     {
3310       rtx pat, old_trial;
3311
3312       /* If we have passed a label, we no longer own this thread.  */
3313       if (GET_CODE (trial) == CODE_LABEL)
3314         {
3315           own_thread = 0;
3316           continue;
3317         }
3318
3319       pat = PATTERN (trial);
3320       if (GET_CODE (pat) == USE || GET_CODE (pat) == CLOBBER)
3321         continue;
3322
3323       /* If TRIAL conflicts with the insns ahead of it, we lose.  Also,
3324          don't separate or copy insns that set and use CC0.  */
3325       if (! insn_references_resource_p (trial, &set, 1)
3326           && ! insn_sets_resource_p (trial, &set, 1)
3327           && ! insn_sets_resource_p (trial, &needed, 1)
3328 #ifdef HAVE_cc0
3329           && ! (reg_mentioned_p (cc0_rtx, pat)
3330                 && (! own_thread || ! sets_cc0_p (pat)))
3331 #endif
3332           )
3333         {
3334           rtx prior_insn;
3335
3336           /* If TRIAL is redundant with some insn before INSN, we don't
3337              actually need to add it to the delay list; we can merely pretend
3338              we did.  */
3339           if (prior_insn = redundant_insn (trial, insn, delay_list))
3340             {
3341               if (own_thread)
3342                 {
3343                   update_block (trial, thread);
3344                   if (trial == thread)
3345                     {
3346                       thread = next_active_insn (thread);
3347                       if (new_thread == trial)
3348                         new_thread = thread;
3349                     }
3350
3351                   delete_insn (trial);
3352                 }
3353               else
3354                 {
3355                   update_reg_unused_notes (prior_insn, trial);
3356                   new_thread = next_active_insn (trial);
3357                 }
3358
3359               continue;
3360             }
3361
3362           /* There are two ways we can win:  If TRIAL doesn't set anything
3363              needed at the opposite thread and can't trap, or if it can
3364              go into an annulled delay slot.  */
3365           if (condition == const_true_rtx
3366               || (! insn_sets_resource_p (trial, &opposite_needed, 1)
3367                   && ! may_trap_p (pat)))
3368             {
3369               old_trial = trial;
3370               trial = try_split (pat, trial, 0);
3371               if (new_thread == old_trial)
3372                 new_thread = trial;
3373               if (thread == old_trial)
3374                 thread = trial;
3375               pat = PATTERN (trial);
3376               if (eligible_for_delay (insn, *pslots_filled, trial, flags))
3377                 goto winner;
3378             }
3379           else if (0
3380 #ifdef ANNUL_IFTRUE_SLOTS
3381                    || ! thread_if_true
3382 #endif
3383 #ifdef ANNUL_IFFALSE_SLOTS
3384                    || thread_if_true
3385 #endif
3386                    )
3387             {
3388               old_trial = trial;
3389               trial = try_split (pat, trial, 0);
3390               if (new_thread == old_trial)
3391                 new_thread = trial;
3392               pat = PATTERN (trial);
3393               if ((thread_if_true
3394                    ? eligible_for_annul_false (insn, *pslots_filled, trial, flags)
3395                    : eligible_for_annul_true (insn, *pslots_filled, trial, flags)))
3396                 {
3397                   rtx temp;
3398
3399                   must_annul = 1;
3400                 winner:
3401
3402 #ifdef HAVE_cc0
3403                   if (reg_mentioned_p (cc0_rtx, pat))
3404                     link_cc0_insns (trial);
3405 #endif
3406
3407                   /* If we own this thread, delete the insn.  If this is the
3408                      destination of a branch, show that a basic block status
3409                      may have been updated.  In any case, mark the new
3410                      starting point of this thread.  */
3411                   if (own_thread)
3412                     {
3413                       update_block (trial, thread);
3414                       delete_insn (trial);
3415                     }
3416                   else
3417                     new_thread = next_active_insn (trial);
3418
3419                   temp = own_thread ? trial : copy_rtx (trial);
3420                   if (thread_if_true)
3421                     INSN_FROM_TARGET_P (temp) = 1;
3422
3423                   delay_list = add_to_delay_list (temp, delay_list);
3424
3425                   if (slots_to_fill == ++(*pslots_filled))
3426                     {
3427                       /* Even though we have filled all the slots, we
3428                          may be branching to a location that has a
3429                          redundant insn.  Skip any if so.  */
3430                       while (new_thread && ! own_thread
3431                              && ! insn_sets_resource_p (new_thread, &set, 1)
3432                              && ! insn_sets_resource_p (new_thread, &needed, 1)
3433                              && ! insn_references_resource_p (new_thread,
3434                                                               &set, 1)
3435                              && redundant_insn (new_thread, insn, delay_list))
3436                         new_thread = next_active_insn (new_thread);
3437                       break;
3438                     }
3439
3440                   continue;
3441                 }
3442             }
3443         }
3444
3445       /* This insn can't go into a delay slot.  */
3446       lose = 1;
3447       mark_set_resources (trial, &set, 0, 1);
3448       mark_referenced_resources (trial, &needed, 1);
3449
3450       /* Ensure we don't put insns between the setting of cc and the comparison
3451          by moving a setting of cc into an earlier delay slot since these insns
3452          could clobber the condition code.  */
3453       set.cc = 1;
3454
3455       /* If this insn is a register-register copy and the next insn has
3456          a use of our destination, change it to use our source.  That way,
3457          it will become a candidate for our delay slot the next time
3458          through this loop.  This case occurs commonly in loops that
3459          scan a list.
3460
3461          We could check for more complex cases than those tested below,
3462          but it doesn't seem worth it.  It might also be a good idea to try
3463          to swap the two insns.  That might do better.
3464
3465          We can't do this if the next insn modifies our destination, because
3466          that would make the replacement into the insn invalid.  We also can't
3467          do this if it modifies our source, because it might be an earlyclobber
3468          operand.  This latter test also prevents updating the contents of
3469          a PRE_INC.  */
3470
3471       if (GET_CODE (trial) == INSN && GET_CODE (pat) == SET
3472           && GET_CODE (SET_SRC (pat)) == REG
3473           && GET_CODE (SET_DEST (pat)) == REG)
3474         {
3475           rtx next = next_nonnote_insn (trial);
3476
3477           if (next && GET_CODE (next) == INSN
3478               && GET_CODE (PATTERN (next)) != USE
3479               && ! reg_set_p (SET_DEST (pat), next)
3480               && ! reg_set_p (SET_SRC (pat), next)
3481               && reg_referenced_p (SET_DEST (pat), PATTERN (next)))
3482             validate_replace_rtx (SET_DEST (pat), SET_SRC (pat), next);
3483         }
3484     }
3485
3486   /* If we stopped on a branch insn that has delay slots, see if we can
3487      steal some of the insns in those slots.  */
3488   if (trial && GET_CODE (trial) == INSN
3489       && GET_CODE (PATTERN (trial)) == SEQUENCE
3490       && GET_CODE (XVECEXP (PATTERN (trial), 0, 0)) == JUMP_INSN)
3491     {
3492       /* If this is the `true' thread, we will want to follow the jump,
3493          so we can only do this if we have taken everything up to here.  */
3494       if (thread_if_true && trial == new_thread)
3495         delay_list
3496           = steal_delay_list_from_target (insn, condition, PATTERN (trial),
3497                                           delay_list, &set, &needed,
3498                                           &opposite_needed, slots_to_fill,
3499                                           pslots_filled, &must_annul,
3500                                           &new_thread);
3501       else if (! thread_if_true)
3502         delay_list
3503           = steal_delay_list_from_fallthrough (insn, condition,
3504                                                PATTERN (trial),
3505                                                delay_list, &set, &needed,
3506                                                &opposite_needed, slots_to_fill,
3507                                                pslots_filled, &must_annul);
3508     }
3509
3510   /* If we haven't found anything for this delay slot and it is very
3511      likely that the branch will be taken, see if the insn at our target
3512      increments or decrements a register with an increment that does not
3513      depend on the destination register.  If so, try to place the opposite
3514      arithmetic insn after the jump insn and put the arithmetic insn in the
3515      delay slot.  If we can't do this, return.  */
3516   if (delay_list == 0 && likely && new_thread && GET_CODE (new_thread) == INSN)
3517     {
3518       rtx pat = PATTERN (new_thread);
3519       rtx dest;
3520       rtx src;
3521
3522       trial = new_thread;
3523       pat = PATTERN (trial);
3524
3525       if (GET_CODE (trial) != INSN || GET_CODE (pat) != SET
3526           || ! eligible_for_delay (insn, 0, trial, flags))
3527         return 0;
3528
3529       dest = SET_DEST (pat), src = SET_SRC (pat);
3530       if ((GET_CODE (src) == PLUS || GET_CODE (src) == MINUS)
3531           && rtx_equal_p (XEXP (src, 0), dest)
3532           && ! reg_overlap_mentioned_p (dest, XEXP (src, 1)))
3533         {
3534           rtx other = XEXP (src, 1);
3535           rtx new_arith;
3536           rtx ninsn;
3537
3538           /* If this is a constant adjustment, use the same code with
3539              the negated constant.  Otherwise, reverse the sense of the
3540              arithmetic.  */
3541           if (GET_CODE (other) == CONST_INT)
3542             new_arith = gen_rtx (GET_CODE (src), GET_MODE (src), dest,
3543                                  negate_rtx (GET_MODE (src), other));
3544           else
3545             new_arith = gen_rtx (GET_CODE (src) == PLUS ? MINUS : PLUS,
3546                                  GET_MODE (src), dest, other);
3547
3548           ninsn = emit_insn_after (gen_rtx (SET, VOIDmode, dest, new_arith),
3549                                    insn);
3550
3551           if (recog_memoized (ninsn) < 0
3552               || (insn_extract (ninsn),
3553                   ! constrain_operands (INSN_CODE (ninsn), 1)))
3554             {
3555               delete_insn (ninsn);
3556               return 0;
3557             }
3558
3559           if (own_thread)
3560             {
3561               update_block (trial, thread);
3562               delete_insn (trial);
3563             }
3564           else
3565             new_thread = next_active_insn (trial);
3566
3567           ninsn = own_thread ? trial : copy_rtx (trial);
3568           if (thread_if_true)
3569             INSN_FROM_TARGET_P (ninsn) = 1;
3570
3571           delay_list = add_to_delay_list (ninsn, NULL_RTX);
3572           (*pslots_filled)++;
3573         }
3574     }
3575
3576   if (delay_list && must_annul)
3577     INSN_ANNULLED_BRANCH_P (insn) = 1;
3578
3579   /* If we are to branch into the middle of this thread, find an appropriate
3580      label or make a new one if none, and redirect INSN to it.  If we hit the
3581      end of the function, use the end-of-function label.  */
3582   if (new_thread != thread)
3583     {
3584       rtx label;
3585
3586       if (! thread_if_true)
3587         abort ();
3588
3589       if (new_thread && GET_CODE (new_thread) == JUMP_INSN
3590           && (simplejump_p (new_thread)
3591               || GET_CODE (PATTERN (new_thread)) == RETURN)
3592           && redirect_with_delay_list_safe_p (insn,
3593                                               JUMP_LABEL (new_thread),
3594                                               delay_list))
3595         new_thread = follow_jumps (JUMP_LABEL (new_thread));
3596
3597       if (new_thread == 0)
3598         label = find_end_label ();
3599       else if (GET_CODE (new_thread) == CODE_LABEL)
3600         label = new_thread;
3601       else
3602         label = get_label_before (new_thread);
3603
3604       reorg_redirect_jump (insn, label);
3605     }
3606
3607   return delay_list;
3608 }
3609 \f
3610 /* Make another attempt to find insns to place in delay slots.
3611
3612    We previously looked for insns located in front of the delay insn
3613    and, for non-jump delay insns, located behind the delay insn.
3614
3615    Here only try to schedule jump insns and try to move insns from either
3616    the target or the following insns into the delay slot.  If annulling is
3617    supported, we will be likely to do this.  Otherwise, we can do this only
3618    if safe.  */
3619
3620 static void
3621 fill_eager_delay_slots (first)
3622      rtx first;
3623 {
3624   register rtx insn;
3625   register int i;
3626   int num_unfilled_slots = unfilled_slots_next - unfilled_slots_base;
3627
3628   for (i = 0; i < num_unfilled_slots; i++)
3629     {
3630       rtx condition;
3631       rtx target_label, insn_at_target, fallthrough_insn;
3632       rtx delay_list = 0;
3633       int own_target;
3634       int own_fallthrough;
3635       int prediction, slots_to_fill, slots_filled;
3636
3637       insn = unfilled_slots_base[i];
3638       if (insn == 0
3639           || INSN_DELETED_P (insn)
3640           || GET_CODE (insn) != JUMP_INSN
3641           || ! (condjump_p (insn) || condjump_in_parallel_p (insn)))
3642         continue;
3643
3644       slots_to_fill = num_delay_slots (insn);
3645       if (slots_to_fill == 0)
3646         abort ();
3647
3648       slots_filled = 0;
3649       target_label = JUMP_LABEL (insn);
3650       condition = get_branch_condition (insn, target_label);
3651
3652       if (condition == 0)
3653         continue;
3654
3655       /* Get the next active fallthough and target insns and see if we own
3656          them.  Then see whether the branch is likely true.  We don't need
3657          to do a lot of this for unconditional branches.  */
3658
3659       insn_at_target = next_active_insn (target_label);
3660       own_target = own_thread_p (target_label, target_label, 0);
3661
3662       if (condition == const_true_rtx)
3663         {
3664           own_fallthrough = 0;
3665           fallthrough_insn = 0;
3666           prediction = 2;
3667         }
3668       else
3669         {
3670           fallthrough_insn = next_active_insn (insn);
3671           own_fallthrough = own_thread_p (NEXT_INSN (insn), NULL_RTX, 1);
3672           prediction = mostly_true_jump (insn, condition);
3673         }
3674
3675       /* If this insn is expected to branch, first try to get insns from our
3676          target, then our fallthrough insns.  If it is not, expected to branch,
3677          try the other order.  */
3678
3679       if (prediction > 0)
3680         {
3681           delay_list
3682             = fill_slots_from_thread (insn, condition, insn_at_target,
3683                                       fallthrough_insn, prediction == 2, 1,
3684                                       own_target, own_fallthrough,
3685                                       slots_to_fill, &slots_filled);
3686
3687           if (delay_list == 0 && own_fallthrough)
3688             {
3689               /* Even though we didn't find anything for delay slots,
3690                  we might have found a redundant insn which we deleted
3691                  from the thread that was filled.  So we have to recompute
3692                  the next insn at the target.  */
3693               target_label = JUMP_LABEL (insn);
3694               insn_at_target = next_active_insn (target_label);
3695
3696               delay_list
3697                 = fill_slots_from_thread (insn, condition, fallthrough_insn,
3698                                           insn_at_target, 0, 0,
3699                                           own_fallthrough, own_target,
3700                                           slots_to_fill, &slots_filled);
3701             }
3702         }
3703       else
3704         {
3705           if (own_fallthrough)
3706             delay_list
3707               = fill_slots_from_thread (insn, condition, fallthrough_insn,
3708                                         insn_at_target, 0, 0,
3709                                         own_fallthrough, own_target,
3710                                         slots_to_fill, &slots_filled);
3711
3712           if (delay_list == 0)
3713             delay_list
3714               = fill_slots_from_thread (insn, condition, insn_at_target,
3715                                         next_active_insn (insn), 0, 1,
3716                                         own_target, own_fallthrough,
3717                                         slots_to_fill, &slots_filled);
3718         }
3719
3720       if (delay_list)
3721         unfilled_slots_base[i]
3722           = emit_delay_sequence (insn, delay_list,
3723                                  slots_filled, slots_to_fill);
3724
3725       if (slots_to_fill == slots_filled)
3726         unfilled_slots_base[i] = 0;
3727
3728       note_delay_statistics (slots_filled, 1);
3729     }
3730 }
3731 \f
3732 /* Once we have tried two ways to fill a delay slot, make a pass over the
3733    code to try to improve the results and to do such things as more jump
3734    threading.  */
3735
3736 static void
3737 relax_delay_slots (first)
3738      rtx first;
3739 {
3740   register rtx insn, next, pat;
3741   register rtx trial, delay_insn, target_label;
3742
3743   /* Look at every JUMP_INSN and see if we can improve it.  */
3744   for (insn = first; insn; insn = next)
3745     {
3746       rtx other;
3747
3748       next = next_active_insn (insn);
3749
3750       /* If this is a jump insn, see if it now jumps to a jump, jumps to
3751          the next insn, or jumps to a label that is not the last of a
3752          group of consecutive labels.  */
3753       if (GET_CODE (insn) == JUMP_INSN
3754           && (condjump_p (insn) || condjump_in_parallel_p (insn))
3755           && (target_label = JUMP_LABEL (insn)) != 0)
3756         {
3757           target_label = follow_jumps (target_label);
3758           target_label = prev_label (next_active_insn (target_label));
3759
3760           if (target_label == 0)
3761             target_label = find_end_label ();
3762
3763           if (next_active_insn (target_label) == next
3764               && ! condjump_in_parallel_p (insn))
3765             {
3766               delete_jump (insn);
3767               continue;
3768             }
3769
3770           if (target_label != JUMP_LABEL (insn))
3771             reorg_redirect_jump (insn, target_label);
3772
3773           /* See if this jump branches around a unconditional jump.
3774              If so, invert this jump and point it to the target of the
3775              second jump.  */
3776           if (next && GET_CODE (next) == JUMP_INSN
3777               && (simplejump_p (next) || GET_CODE (PATTERN (next)) == RETURN)
3778               && next_active_insn (target_label) == next_active_insn (next)
3779               && no_labels_between_p (insn, next))
3780             {
3781               rtx label = JUMP_LABEL (next);
3782
3783               /* Be careful how we do this to avoid deleting code or
3784                  labels that are momentarily dead.  See similar optimization
3785                  in jump.c.
3786
3787                  We also need to ensure we properly handle the case when
3788                  invert_jump fails.  */
3789
3790               ++LABEL_NUSES (target_label);
3791               if (label)
3792                 ++LABEL_NUSES (label);
3793
3794               if (invert_jump (insn, label))
3795                 {
3796                   delete_insn (next);
3797                   next = insn;
3798                 }
3799
3800               if (label)
3801                 --LABEL_NUSES (label);
3802
3803               if (--LABEL_NUSES (target_label) == 0)
3804                 delete_insn (target_label);
3805
3806               continue;
3807             }
3808         }
3809
3810       /* If this is an unconditional jump and the previous insn is a
3811          conditional jump, try reversing the condition of the previous
3812          insn and swapping our targets.  The next pass might be able to
3813          fill the slots.
3814
3815          Don't do this if we expect the conditional branch to be true, because
3816          we would then be making the more common case longer.  */
3817
3818       if (GET_CODE (insn) == JUMP_INSN
3819           && (simplejump_p (insn) || GET_CODE (PATTERN (insn)) == RETURN)
3820           && (other = prev_active_insn (insn)) != 0
3821           && (condjump_p (other) || condjump_in_parallel_p (other))
3822           && no_labels_between_p (other, insn)
3823           && 0 < mostly_true_jump (other,
3824                                    get_branch_condition (other,
3825                                                          JUMP_LABEL (other))))
3826         {
3827           rtx other_target = JUMP_LABEL (other);
3828           target_label = JUMP_LABEL (insn);
3829
3830           /* Increment the count of OTHER_TARGET, so it doesn't get deleted
3831              as we move the label.  */
3832           if (other_target)
3833             ++LABEL_NUSES (other_target);
3834
3835           if (invert_jump (other, target_label))
3836             reorg_redirect_jump (insn, other_target);
3837
3838           if (other_target)
3839             --LABEL_NUSES (other_target);
3840         }
3841
3842       /* Now look only at cases where we have filled a delay slot.  */
3843       if (GET_CODE (insn) != INSN
3844           || GET_CODE (PATTERN (insn)) != SEQUENCE)
3845         continue;
3846
3847       pat = PATTERN (insn);
3848       delay_insn = XVECEXP (pat, 0, 0);
3849
3850       /* See if the first insn in the delay slot is redundant with some
3851          previous insn.  Remove it from the delay slot if so; then set up
3852          to reprocess this insn.  */
3853       if (redundant_insn (XVECEXP (pat, 0, 1), delay_insn, 0))
3854         {
3855           delete_from_delay_slot (XVECEXP (pat, 0, 1));
3856           next = prev_active_insn (next);
3857           continue;
3858         }
3859
3860       /* Now look only at the cases where we have a filled JUMP_INSN.  */
3861       if (GET_CODE (XVECEXP (PATTERN (insn), 0, 0)) != JUMP_INSN
3862           || ! (condjump_p (XVECEXP (PATTERN (insn), 0, 0))
3863                 || condjump_in_parallel_p (XVECEXP (PATTERN (insn), 0, 0))))
3864         continue;
3865
3866       target_label = JUMP_LABEL (delay_insn);
3867
3868       if (target_label)
3869         {
3870           /* If this jump goes to another unconditional jump, thread it, but
3871              don't convert a jump into a RETURN here.  */
3872           trial = follow_jumps (target_label);
3873           /* We use next_real_insn instead of next_active_insn, so that
3874              the special USE insns emitted by reorg won't be ignored.
3875              If they are ignored, then they will get deleted if target_label
3876              is now unreachable, and that would cause mark_target_live_regs
3877              to fail.  */
3878           trial = prev_label (next_real_insn (trial));
3879           if (trial == 0 && target_label != 0)
3880             trial = find_end_label ();
3881
3882           if (trial != target_label
3883               && redirect_with_delay_slots_safe_p (delay_insn, trial, insn))
3884             {
3885               reorg_redirect_jump (delay_insn, trial);
3886               target_label = trial;
3887             }
3888
3889           /* If the first insn at TARGET_LABEL is redundant with a previous
3890              insn, redirect the jump to the following insn process again.  */
3891           trial = next_active_insn (target_label);
3892           if (trial && GET_CODE (PATTERN (trial)) != SEQUENCE
3893               && redundant_insn (trial, insn, 0))
3894             {
3895               trial = next_active_insn (trial);
3896               if (trial == 0)
3897                 target_label = find_end_label ();
3898               else
3899                 target_label = get_label_before (trial);
3900               reorg_redirect_jump (delay_insn, target_label);
3901               next = insn;
3902               continue;
3903             }
3904
3905           /* Similarly, if it is an unconditional jump with one insn in its
3906              delay list and that insn is redundant, thread the jump.  */
3907           if (trial && GET_CODE (PATTERN (trial)) == SEQUENCE
3908               && XVECLEN (PATTERN (trial), 0) == 2
3909               && GET_CODE (XVECEXP (PATTERN (trial), 0, 0)) == JUMP_INSN
3910               && (simplejump_p (XVECEXP (PATTERN (trial), 0, 0))
3911                   || GET_CODE (PATTERN (XVECEXP (PATTERN (trial), 0, 0))) == RETURN)
3912               && redundant_insn (XVECEXP (PATTERN (trial), 0, 1), insn, 0))
3913             {
3914               target_label = JUMP_LABEL (XVECEXP (PATTERN (trial), 0, 0));
3915               if (target_label == 0)
3916                 target_label = find_end_label ();
3917
3918               if (redirect_with_delay_slots_safe_p (delay_insn, target_label,
3919                                                     insn))
3920                 {
3921                   reorg_redirect_jump (delay_insn, target_label);
3922                   next = insn;
3923                   continue;
3924                 }
3925             }
3926         }
3927
3928       if (! INSN_ANNULLED_BRANCH_P (delay_insn)
3929           && prev_active_insn (target_label) == insn
3930           && ! condjump_in_parallel_p (delay_insn)
3931 #ifdef HAVE_cc0
3932           /* If the last insn in the delay slot sets CC0 for some insn,
3933              various code assumes that it is in a delay slot.  We could
3934              put it back where it belonged and delete the register notes,
3935              but it doesn't seem worthwhile in this uncommon case.  */
3936           && ! find_reg_note (XVECEXP (pat, 0, XVECLEN (pat, 0) - 1),
3937                               REG_CC_USER, NULL_RTX)
3938 #endif
3939           )
3940         {
3941           int i;
3942
3943           /* All this insn does is execute its delay list and jump to the
3944              following insn.  So delete the jump and just execute the delay
3945              list insns.
3946
3947              We do this by deleting the INSN containing the SEQUENCE, then
3948              re-emitting the insns separately, and then deleting the jump.
3949              This allows the count of the jump target to be properly
3950              decremented.  */
3951
3952           /* Clear the from target bit, since these insns are no longer
3953              in delay slots.  */
3954           for (i = 0; i < XVECLEN (pat, 0); i++)
3955             INSN_FROM_TARGET_P (XVECEXP (pat, 0, i)) = 0;
3956
3957           trial = PREV_INSN (insn);
3958           delete_insn (insn);
3959           emit_insn_after (pat, trial);
3960           delete_scheduled_jump (delay_insn);
3961           continue;
3962         }
3963
3964       /* See if this is an unconditional jump around a single insn which is
3965          identical to the one in its delay slot.  In this case, we can just
3966          delete the branch and the insn in its delay slot.  */
3967       if (next && GET_CODE (next) == INSN
3968           && prev_label (next_active_insn (next)) == target_label
3969           && simplejump_p (insn)
3970           && XVECLEN (pat, 0) == 2
3971           && rtx_equal_p (PATTERN (next), PATTERN (XVECEXP (pat, 0, 1))))
3972         {
3973           delete_insn (insn);
3974           continue;
3975         }
3976
3977       /* See if this jump (with its delay slots) branches around another
3978          jump (without delay slots).  If so, invert this jump and point
3979          it to the target of the second jump.  We cannot do this for
3980          annulled jumps, though.  Again, don't convert a jump to a RETURN
3981          here.  */
3982       if (! INSN_ANNULLED_BRANCH_P (delay_insn)
3983           && next && GET_CODE (next) == JUMP_INSN
3984           && (simplejump_p (next) || GET_CODE (PATTERN (next)) == RETURN)
3985           && next_active_insn (target_label) == next_active_insn (next)
3986           && no_labels_between_p (insn, next))
3987         {
3988           rtx label = JUMP_LABEL (next);
3989           rtx old_label = JUMP_LABEL (delay_insn);
3990
3991           if (label == 0)
3992             label = find_end_label ();
3993
3994           if (redirect_with_delay_slots_safe_p (delay_insn, label, insn))
3995             {
3996               /* Be careful how we do this to avoid deleting code or labels
3997                  that are momentarily dead.  See similar optimization in
3998                  jump.c  */
3999               if (old_label)
4000                 ++LABEL_NUSES (old_label);
4001
4002               if (invert_jump (delay_insn, label))
4003                 {
4004                   int i;
4005
4006                   /* Must update the INSN_FROM_TARGET_P bits now that
4007                      the branch is reversed, so that mark_target_live_regs
4008                      will handle the delay slot insn correctly.  */
4009                   for (i = 1; i < XVECLEN (PATTERN (insn), 0); i++)
4010                     {
4011                       rtx slot = XVECEXP (PATTERN (insn), 0, i);
4012                       INSN_FROM_TARGET_P (slot) = ! INSN_FROM_TARGET_P (slot);
4013                     }
4014
4015                   delete_insn (next);
4016                   next = insn;
4017                 }
4018
4019               if (old_label && --LABEL_NUSES (old_label) == 0)
4020                 delete_insn (old_label);
4021               continue;
4022             }
4023         }
4024
4025       /* If we own the thread opposite the way this insn branches, see if we
4026          can merge its delay slots with following insns.  */
4027       if (INSN_FROM_TARGET_P (XVECEXP (pat, 0, 1))
4028           && own_thread_p (NEXT_INSN (insn), 0, 1))
4029         try_merge_delay_insns (insn, next);
4030       else if (! INSN_FROM_TARGET_P (XVECEXP (pat, 0, 1))
4031                && own_thread_p (target_label, target_label, 0))
4032         try_merge_delay_insns (insn, next_active_insn (target_label));
4033
4034       /* If we get here, we haven't deleted INSN.  But we may have deleted
4035          NEXT, so recompute it.  */
4036       next = next_active_insn (insn);
4037     }
4038 }
4039 \f
4040 #ifdef HAVE_return
4041
4042 /* Look for filled jumps to the end of function label.  We can try to convert
4043    them into RETURN insns if the insns in the delay slot are valid for the
4044    RETURN as well.  */
4045
4046 static void
4047 make_return_insns (first)
4048      rtx first;
4049 {
4050   rtx insn, jump_insn, pat;
4051   rtx real_return_label = end_of_function_label;
4052   int slots, i;
4053
4054   /* See if there is a RETURN insn in the function other than the one we
4055      made for END_OF_FUNCTION_LABEL.  If so, set up anything we can't change
4056      into a RETURN to jump to it.  */
4057   for (insn = first; insn; insn = NEXT_INSN (insn))
4058     if (GET_CODE (insn) == JUMP_INSN && GET_CODE (PATTERN (insn)) == RETURN)
4059       {
4060         real_return_label = get_label_before (insn);
4061         break;
4062       }
4063
4064   /* Show an extra usage of REAL_RETURN_LABEL so it won't go away if it
4065      was equal to END_OF_FUNCTION_LABEL.  */
4066   LABEL_NUSES (real_return_label)++;
4067
4068   /* Clear the list of insns to fill so we can use it.  */
4069   obstack_free (&unfilled_slots_obstack, unfilled_firstobj);
4070
4071   for (insn = first; insn; insn = NEXT_INSN (insn))
4072     {
4073       int flags;
4074
4075       /* Only look at filled JUMP_INSNs that go to the end of function
4076          label.  */
4077       if (GET_CODE (insn) != INSN
4078           || GET_CODE (PATTERN (insn)) != SEQUENCE
4079           || GET_CODE (XVECEXP (PATTERN (insn), 0, 0)) != JUMP_INSN
4080           || JUMP_LABEL (XVECEXP (PATTERN (insn), 0, 0)) != end_of_function_label)
4081         continue;
4082
4083       pat = PATTERN (insn);
4084       jump_insn = XVECEXP (pat, 0, 0);
4085
4086       /* If we can't make the jump into a RETURN, try to redirect it to the best
4087          RETURN and go on to the next insn.  */
4088       if (! reorg_redirect_jump (jump_insn, NULL_RTX))
4089         {
4090           /* Make sure redirecting the jump will not invalidate the delay
4091              slot insns.  */
4092           if (redirect_with_delay_slots_safe_p (jump_insn,
4093                                                 real_return_label,
4094                                                 insn))
4095             reorg_redirect_jump (jump_insn, real_return_label);
4096           continue;
4097         }
4098
4099       /* See if this RETURN can accept the insns current in its delay slot.
4100          It can if it has more or an equal number of slots and the contents
4101          of each is valid.  */
4102
4103       flags = get_jump_flags (jump_insn, JUMP_LABEL (jump_insn));
4104       slots = num_delay_slots (jump_insn);
4105       if (slots >= XVECLEN (pat, 0) - 1)
4106         {
4107           for (i = 1; i < XVECLEN (pat, 0); i++)
4108             if (! (
4109 #ifdef ANNUL_IFFALSE_SLOTS
4110                    (INSN_ANNULLED_BRANCH_P (jump_insn)
4111                     && INSN_FROM_TARGET_P (XVECEXP (pat, 0, i)))
4112                    ? eligible_for_annul_false (jump_insn, i - 1,
4113                                                XVECEXP (pat, 0, i), flags) :
4114 #endif
4115 #ifdef ANNUL_IFTRUE_SLOTS
4116                    (INSN_ANNULLED_BRANCH_P (jump_insn)
4117                     && ! INSN_FROM_TARGET_P (XVECEXP (pat, 0, i)))
4118                    ? eligible_for_annul_true (jump_insn, i - 1,
4119                                               XVECEXP (pat, 0, i), flags) :
4120 #endif
4121                    eligible_for_delay (jump_insn, i -1, XVECEXP (pat, 0, i), flags)))
4122               break;
4123         }
4124       else
4125         i = 0;
4126
4127       if (i == XVECLEN (pat, 0))
4128         continue;
4129
4130       /* We have to do something with this insn.  If it is an unconditional
4131          RETURN, delete the SEQUENCE and output the individual insns,
4132          followed by the RETURN.  Then set things up so we try to find
4133          insns for its delay slots, if it needs some.  */
4134       if (GET_CODE (PATTERN (jump_insn)) == RETURN)
4135         {
4136           rtx prev = PREV_INSN (insn);
4137
4138           delete_insn (insn);
4139           for (i = 1; i < XVECLEN (pat, 0); i++)
4140             prev = emit_insn_after (PATTERN (XVECEXP (pat, 0, i)), prev);
4141
4142           insn = emit_jump_insn_after (PATTERN (jump_insn), prev);
4143           emit_barrier_after (insn);
4144
4145           if (slots)
4146             obstack_ptr_grow (&unfilled_slots_obstack, insn);
4147         }
4148       else
4149         /* It is probably more efficient to keep this with its current
4150            delay slot as a branch to a RETURN.  */
4151         reorg_redirect_jump (jump_insn, real_return_label);
4152     }
4153
4154   /* Now delete REAL_RETURN_LABEL if we never used it.  Then try to fill any
4155      new delay slots we have created.  */
4156   if (--LABEL_NUSES (real_return_label) == 0)
4157     delete_insn (real_return_label);
4158
4159   fill_simple_delay_slots (first, 1);
4160   fill_simple_delay_slots (first, 0);
4161 }
4162 #endif
4163 \f
4164 /* Try to find insns to place in delay slots.  */
4165
4166 void
4167 dbr_schedule (first, file)
4168      rtx first;
4169      FILE *file;
4170 {
4171   rtx insn, next, epilogue_insn = 0;
4172   int i;
4173 #if 0
4174   int old_flag_no_peephole = flag_no_peephole;
4175
4176   /* Execute `final' once in prescan mode to delete any insns that won't be
4177      used.  Don't let final try to do any peephole optimization--it will
4178      ruin dataflow information for this pass.  */
4179
4180   flag_no_peephole = 1;
4181   final (first, 0, NO_DEBUG, 1, 1);
4182   flag_no_peephole = old_flag_no_peephole;
4183 #endif
4184
4185   /* If the current function has no insns other than the prologue and
4186      epilogue, then do not try to fill any delay slots.  */
4187   if (n_basic_blocks == 0)
4188     return;
4189
4190   /* Find the highest INSN_UID and allocate and initialize our map from
4191      INSN_UID's to position in code.  */
4192   for (max_uid = 0, insn = first; insn; insn = NEXT_INSN (insn))
4193     {
4194       if (INSN_UID (insn) > max_uid)
4195         max_uid = INSN_UID (insn);
4196       if (GET_CODE (insn) == NOTE
4197           && NOTE_LINE_NUMBER (insn) == NOTE_INSN_EPILOGUE_BEG)
4198         epilogue_insn = insn;
4199     }
4200
4201   uid_to_ruid = (int *) alloca ((max_uid + 1) * sizeof (int *));
4202   for (i = 0, insn = first; insn; i++, insn = NEXT_INSN (insn))
4203     uid_to_ruid[INSN_UID (insn)] = i;
4204
4205   /* Initialize the list of insns that need filling.  */
4206   if (unfilled_firstobj == 0)
4207     {
4208       gcc_obstack_init (&unfilled_slots_obstack);
4209       unfilled_firstobj = (rtx *) obstack_alloc (&unfilled_slots_obstack, 0);
4210     }
4211
4212   for (insn = next_active_insn (first); insn; insn = next_active_insn (insn))
4213     {
4214       rtx target;
4215
4216       INSN_ANNULLED_BRANCH_P (insn) = 0;
4217       INSN_FROM_TARGET_P (insn) = 0;
4218
4219       /* Skip vector tables.  We can't get attributes for them.  */
4220       if (GET_CODE (insn) == JUMP_INSN
4221           && (GET_CODE (PATTERN (insn)) == ADDR_VEC
4222               || GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC))
4223         continue;
4224
4225       if (num_delay_slots (insn) > 0)
4226         obstack_ptr_grow (&unfilled_slots_obstack, insn);
4227
4228       /* Ensure all jumps go to the last of a set of consecutive labels.  */
4229       if (GET_CODE (insn) == JUMP_INSN
4230           && (condjump_p (insn) || condjump_in_parallel_p (insn))
4231           && JUMP_LABEL (insn) != 0
4232           && ((target = prev_label (next_active_insn (JUMP_LABEL (insn))))
4233               != JUMP_LABEL (insn)))
4234         redirect_jump (insn, target);
4235     }
4236
4237   /* Indicate what resources are required to be valid at the end of the current
4238      function.  The condition code never is and memory always is.  If the
4239      frame pointer is needed, it is and so is the stack pointer unless
4240      EXIT_IGNORE_STACK is non-zero.  If the frame pointer is not needed, the
4241      stack pointer is.  Registers used to return the function value are
4242      needed.  Registers holding global variables are needed.  */
4243
4244   end_of_function_needs.cc = 0;
4245   end_of_function_needs.memory = 1;
4246   CLEAR_HARD_REG_SET (end_of_function_needs.regs);
4247
4248   if (frame_pointer_needed)
4249     {
4250       SET_HARD_REG_BIT (end_of_function_needs.regs, FRAME_POINTER_REGNUM);
4251 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
4252       SET_HARD_REG_BIT (end_of_function_needs.regs, HARD_FRAME_POINTER_REGNUM);
4253 #endif
4254 #ifdef EXIT_IGNORE_STACK
4255       if (! EXIT_IGNORE_STACK)
4256 #endif
4257         SET_HARD_REG_BIT (end_of_function_needs.regs, STACK_POINTER_REGNUM);
4258     }
4259   else
4260     SET_HARD_REG_BIT (end_of_function_needs.regs, STACK_POINTER_REGNUM);
4261
4262   if (current_function_return_rtx != 0
4263       && GET_CODE (current_function_return_rtx) == REG)
4264     mark_referenced_resources (current_function_return_rtx,
4265                                &end_of_function_needs, 1);
4266
4267   for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
4268     if (global_regs[i])
4269       SET_HARD_REG_BIT (end_of_function_needs.regs, i);
4270
4271   /* The registers required to be live at the end of the function are
4272      represented in the flow information as being dead just prior to
4273      reaching the end of the function.  For example, the return of a value
4274      might be represented by a USE of the return register immediately
4275      followed by an unconditional jump to the return label where the
4276      return label is the end of the RTL chain.  The end of the RTL chain
4277      is then taken to mean that the return register is live.
4278
4279      This sequence is no longer maintained when epilogue instructions are
4280      added to the RTL chain.  To reconstruct the original meaning, the
4281      start of the epilogue (NOTE_INSN_EPILOGUE_BEG) is regarded as the
4282      point where these registers become live (start_of_epilogue_needs).
4283      If epilogue instructions are present, the registers set by those
4284      instructions won't have been processed by flow.  Thus, those
4285      registers are additionally required at the end of the RTL chain
4286      (end_of_function_needs).  */
4287
4288   start_of_epilogue_needs = end_of_function_needs;
4289
4290   while (epilogue_insn = next_nonnote_insn (epilogue_insn))
4291     mark_set_resources (epilogue_insn, &end_of_function_needs, 0, 1);
4292
4293   /* Show we haven't computed an end-of-function label yet.  */
4294   end_of_function_label = 0;
4295
4296   /* Allocate and initialize the tables used by mark_target_live_regs.  */
4297   target_hash_table
4298     = (struct target_info **) alloca ((TARGET_HASH_PRIME
4299                                        * sizeof (struct target_info *)));
4300   bzero ((char *) target_hash_table,
4301          TARGET_HASH_PRIME * sizeof (struct target_info *));
4302
4303   bb_ticks = (int *) alloca (n_basic_blocks * sizeof (int));
4304   bzero ((char *) bb_ticks, n_basic_blocks * sizeof (int));
4305
4306   /* Initialize the statistics for this function.  */
4307   bzero ((char *) num_insns_needing_delays, sizeof num_insns_needing_delays);
4308   bzero ((char *) num_filled_delays, sizeof num_filled_delays);
4309
4310   /* Now do the delay slot filling.  Try everything twice in case earlier
4311      changes make more slots fillable.  */
4312
4313   for (reorg_pass_number = 0;
4314        reorg_pass_number < MAX_REORG_PASSES;
4315        reorg_pass_number++)
4316     {
4317       fill_simple_delay_slots (first, 1);
4318       fill_simple_delay_slots (first, 0);
4319       fill_eager_delay_slots (first);
4320       relax_delay_slots (first);
4321     }
4322
4323   /* Delete any USE insns made by update_block; subsequent passes don't need
4324      them or know how to deal with them.  */
4325   for (insn = first; insn; insn = next)
4326     {
4327       next = NEXT_INSN (insn);
4328
4329       if (GET_CODE (insn) == INSN && GET_CODE (PATTERN (insn)) == USE
4330           && GET_RTX_CLASS (GET_CODE (XEXP (PATTERN (insn), 0))) == 'i')
4331         next = delete_insn (insn);
4332     }
4333
4334   /* If we made an end of function label, indicate that it is now
4335      safe to delete it by undoing our prior adjustment to LABEL_NUSES.
4336      If it is now unused, delete it.  */
4337   if (end_of_function_label && --LABEL_NUSES (end_of_function_label) == 0)
4338     delete_insn (end_of_function_label);
4339
4340 #ifdef HAVE_return
4341   if (HAVE_return && end_of_function_label != 0)
4342     make_return_insns (first);
4343 #endif
4344
4345   obstack_free (&unfilled_slots_obstack, unfilled_firstobj);
4346
4347   /* It is not clear why the line below is needed, but it does seem to be.  */
4348   unfilled_firstobj = (rtx *) obstack_alloc (&unfilled_slots_obstack, 0);
4349
4350   /* Reposition the prologue and epilogue notes in case we moved the
4351      prologue/epilogue insns.  */
4352   reposition_prologue_and_epilogue_notes (first);
4353
4354   if (file)
4355     {
4356       register int i, j, need_comma;
4357
4358       for (reorg_pass_number = 0;
4359            reorg_pass_number < MAX_REORG_PASSES;
4360            reorg_pass_number++)
4361         {
4362           fprintf (file, ";; Reorg pass #%d:\n", reorg_pass_number + 1);
4363           for (i = 0; i < NUM_REORG_FUNCTIONS; i++)
4364             {
4365               need_comma = 0;
4366               fprintf (file, ";; Reorg function #%d\n", i);
4367
4368               fprintf (file, ";; %d insns needing delay slots\n;; ",
4369                        num_insns_needing_delays[i][reorg_pass_number]);
4370
4371               for (j = 0; j < MAX_DELAY_HISTOGRAM; j++)
4372                 if (num_filled_delays[i][j][reorg_pass_number])
4373                   {
4374                     if (need_comma)
4375                       fprintf (file, ", ");
4376                     need_comma = 1;
4377                     fprintf (file, "%d got %d delays",
4378                              num_filled_delays[i][j][reorg_pass_number], j);
4379                   }
4380               fprintf (file, "\n");
4381             }
4382         }
4383     }
4384 }
4385 #endif /* DELAY_SLOTS */