gcc/haifa-sched.c

   1 /* Instruction scheduling pass.
   2    Copyright (C) 1992, 1993, 1994, 1995, 1996, 1997, 1998,
   3    1999, 2000, 2001, 2002, 2003, 2004 Free Software Foundation, Inc.
   4    Contributed by Michael Tiemann (tiemann@cygnus.com) Enhanced by,
   5    and currently maintained by, Jim Wilson (wilson@cygnus.com)
   6
   7 This file is part of GCC.
   8
   9 GCC is free software; you can redistribute it and/or modify it under
  10 the terms of the GNU General Public License as published by the Free
  11 Software Foundation; either version 2, or (at your option) any later
  12 version.
  13
  14 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  15 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  16 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  17 for more details.
  18
  19 You should have received a copy of the GNU General Public License
  20 along with GCC; see the file COPYING.  If not, write to the Free
  21 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  22 02111-1307, USA.  */
  23
  24 /* Instruction scheduling pass.  This file, along with sched-deps.c,
  25    contains the generic parts.  The actual entry point is found for
  26    the normal instruction scheduling pass is found in sched-rgn.c.
  27
  28    We compute insn priorities based on data dependencies.  Flow
  29    analysis only creates a fraction of the data-dependencies we must
  30    observe: namely, only those dependencies which the combiner can be
  31    expected to use.  For this pass, we must therefore create the
  32    remaining dependencies we need to observe: register dependencies,
  33    memory dependencies, dependencies to keep function calls in order,
  34    and the dependence between a conditional branch and the setting of
  35    condition codes are all dealt with here.
  36
  37    The scheduler first traverses the data flow graph, starting with
  38    the last instruction, and proceeding to the first, assigning values
  39    to insn_priority as it goes.  This sorts the instructions
  40    topologically by data dependence.
  41
  42    Once priorities have been established, we order the insns using
  43    list scheduling.  This works as follows: starting with a list of
  44    all the ready insns, and sorted according to priority number, we
  45    schedule the insn from the end of the list by placing its
  46    predecessors in the list according to their priority order.  We
  47    consider this insn scheduled by setting the pointer to the "end" of
  48    the list to point to the previous insn.  When an insn has no
  49    predecessors, we either queue it until sufficient time has elapsed
  50    or add it to the ready list.  As the instructions are scheduled or
  51    when stalls are introduced, the queue advances and dumps insns into
  52    the ready list.  When all insns down to the lowest priority have
  53    been scheduled, the critical path of the basic block has been made
  54    as short as possible.  The remaining insns are then scheduled in
  55    remaining slots.
  56
  57    The following list shows the order in which we want to break ties
  58    among insns in the ready list:
  59
  60    1.  choose insn with the longest path to end of bb, ties
  61    broken by
  62    2.  choose insn with least contribution to register pressure,
  63    ties broken by
  64    3.  prefer in-block upon interblock motion, ties broken by
  65    4.  prefer useful upon speculative motion, ties broken by
  66    5.  choose insn with largest control flow probability, ties
  67    broken by
  68    6.  choose insn with the least dependences upon the previously
  69    scheduled insn, or finally
  70    7   choose the insn which has the most insns dependent on it.
  71    8.  choose insn with lowest UID.
  72
  73    Memory references complicate matters.  Only if we can be certain
  74    that memory references are not part of the data dependency graph
  75    (via true, anti, or output dependence), can we move operations past
  76    memory references.  To first approximation, reads can be done
  77    independently, while writes introduce dependencies.  Better
  78    approximations will yield fewer dependencies.
  79
  80    Before reload, an extended analysis of interblock data dependences
  81    is required for interblock scheduling.  This is performed in
  82    compute_block_backward_dependences ().
  83
  84    Dependencies set up by memory references are treated in exactly the
  85    same way as other dependencies, by using LOG_LINKS backward
  86    dependences.  LOG_LINKS are translated into INSN_DEPEND forward
  87    dependences for the purpose of forward list scheduling.
  88
  89    Having optimized the critical path, we may have also unduly
  90    extended the lifetimes of some registers.  If an operation requires
  91    that constants be loaded into registers, it is certainly desirable
  92    to load those constants as early as necessary, but no earlier.
  93    I.e., it will not do to load up a bunch of registers at the
  94    beginning of a basic block only to use them at the end, if they
  95    could be loaded later, since this may result in excessive register
  96    utilization.
  97
  98    Note that since branches are never in basic blocks, but only end
  99    basic blocks, this pass will not move branches.  But that is ok,
 100    since we can use GNU's delayed branch scheduling pass to take care
 101    of this case.
 102
 103    Also note that no further optimizations based on algebraic
 104    identities are performed, so this pass would be a good one to
 105    perform instruction splitting, such as breaking up a multiply
 106    instruction into shifts and adds where that is profitable.
 107
 108    Given the memory aliasing analysis that this pass should perform,
 109    it should be possible to remove redundant stores to memory, and to
 110    load values from registers instead of hitting memory.
 111
 112    Before reload, speculative insns are moved only if a 'proof' exists
 113    that no exception will be caused by this, and if no live registers
 114    exist that inhibit the motion (live registers constraints are not
 115    represented by data dependence edges).
 116
 117    This pass must update information that subsequent passes expect to
 118    be correct.  Namely: reg_n_refs, reg_n_sets, reg_n_deaths,
 119    reg_n_calls_crossed, and reg_live_length.  Also, BB_HEAD, BB_END.
 120
 121    The information in the line number notes is carefully retained by
 122    this pass.  Notes that refer to the starting and ending of
 123    exception regions are also carefully retained by this pass.  All
 124    other NOTE insns are grouped in their same relative order at the
 125    beginning of basic blocks and regions that have been scheduled.  */
 126 \f
 127 #include "config.h"
 128 #include "system.h"
 129 #include "coretypes.h"
 130 #include "tm.h"
 131 #include "toplev.h"
 132 #include "rtl.h"
 133 #include "tm_p.h"
 134 #include "hard-reg-set.h"
 135 #include "regs.h"
 136 #include "function.h"
 137 #include "flags.h"
 138 #include "insn-config.h"
 139 #include "insn-attr.h"
 140 #include "except.h"
 141 #include "toplev.h"
 142 #include "recog.h"
 143 #include "sched-int.h"
 144 #include "target.h"
 145
 146 #ifdef INSN_SCHEDULING
 147
 148 /* issue_rate is the number of insns that can be scheduled in the same
 149    machine cycle.  It can be defined in the config/mach/mach.h file,
 150    otherwise we set it to 1.  */
 151
 152 static int issue_rate;
 153
 154 /* sched-verbose controls the amount of debugging output the
 155    scheduler prints.  It is controlled by -fsched-verbose=N:
 156    N>0 and no -DSR : the output is directed to stderr.
 157    N>=10 will direct the printouts to stderr (regardless of -dSR).
 158    N=1: same as -dSR.
 159    N=2: bb's probabilities, detailed ready list info, unit/insn info.
 160    N=3: rtl at abort point, control-flow, regions info.
 161    N=5: dependences info.  */
 162
 163 static int sched_verbose_param = 0;
 164 int sched_verbose = 0;
 165
 166 /* Debugging file.  All printouts are sent to dump, which is always set,
 167    either to stderr, or to the dump listing file (-dRS).  */
 168 FILE *sched_dump = 0;
 169
 170 /* Highest uid before scheduling.  */
 171 static int old_max_uid;
 172
 173 /* fix_sched_param() is called from toplev.c upon detection
 174    of the -fsched-verbose=N option.  */
 175
 176 void
 177 fix_sched_param (const char *param, const char *val)
 178 {
 179   if (!strcmp (param, "verbose"))
 180     sched_verbose_param = atoi (val);
 181   else
 182     warning ("fix_sched_param: unknown param: %s", param);
 183 }
 184
 185 struct haifa_insn_data *h_i_d;
 186
 187 #define LINE_NOTE(INSN)         (h_i_d[INSN_UID (INSN)].line_note)
 188 #define INSN_TICK(INSN)         (h_i_d[INSN_UID (INSN)].tick)
 189
 190 /* Vector indexed by basic block number giving the starting line-number
 191    for each basic block.  */
 192 static rtx *line_note_head;
 193
 194 /* List of important notes we must keep around.  This is a pointer to the
 195    last element in the list.  */
 196 static rtx note_list;
 197
 198 /* Queues, etc.  */
 199
 200 /* An instruction is ready to be scheduled when all insns preceding it
 201    have already been scheduled.  It is important to ensure that all
 202    insns which use its result will not be executed until its result
 203    has been computed.  An insn is maintained in one of four structures:
 204
 205    (P) the "Pending" set of insns which cannot be scheduled until
 206    their dependencies have been satisfied.
 207    (Q) the "Queued" set of insns that can be scheduled when sufficient
 208    time has passed.
 209    (R) the "Ready" list of unscheduled, uncommitted insns.
 210    (S) the "Scheduled" list of insns.
 211
 212    Initially, all insns are either "Pending" or "Ready" depending on
 213    whether their dependencies are satisfied.
 214
 215    Insns move from the "Ready" list to the "Scheduled" list as they
 216    are committed to the schedule.  As this occurs, the insns in the
 217    "Pending" list have their dependencies satisfied and move to either
 218    the "Ready" list or the "Queued" set depending on whether
 219    sufficient time has passed to make them ready.  As time passes,
 220    insns move from the "Queued" set to the "Ready" list.
 221
 222    The "Pending" list (P) are the insns in the INSN_DEPEND of the unscheduled
 223    insns, i.e., those that are ready, queued, and pending.
 224    The "Queued" set (Q) is implemented by the variable `insn_queue'.
 225    The "Ready" list (R) is implemented by the variables `ready' and
 226    `n_ready'.
 227    The "Scheduled" list (S) is the new insn chain built by this pass.
 228
 229    The transition (R->S) is implemented in the scheduling loop in
 230    `schedule_block' when the best insn to schedule is chosen.
 231    The transitions (P->R and P->Q) are implemented in `schedule_insn' as
 232    insns move from the ready list to the scheduled list.
 233    The transition (Q->R) is implemented in 'queue_to_insn' as time
 234    passes or stalls are introduced.  */
 235
 236 /* Implement a circular buffer to delay instructions until sufficient
 237    time has passed.  For the new pipeline description interface,
 238    MAX_INSN_QUEUE_INDEX is a power of two minus one which is larger
 239    than maximal time of instruction execution computed by genattr.c on
 240    the base maximal time of functional unit reservations and getting a
 241    result.  This is the longest time an insn may be queued.  */
 242
 243 static rtx *insn_queue;
 244 static int q_ptr = 0;
 245 static int q_size = 0;
 246 #define NEXT_Q(X) (((X)+1) & max_insn_queue_index)
 247 #define NEXT_Q_AFTER(X, C) (((X)+C) & max_insn_queue_index)
 248
 249 /* The following variable value refers for all current and future
 250    reservations of the processor units.  */
 251 state_t curr_state;
 252
 253 /* The following variable value is size of memory representing all
 254    current and future reservations of the processor units.  */
 255 static size_t dfa_state_size;
 256
 257 /* The following array is used to find the best insn from ready when
 258    the automaton pipeline interface is used.  */
 259 static char *ready_try;
 260
 261 /* Describe the ready list of the scheduler.
 262    VEC holds space enough for all insns in the current region.  VECLEN
 263    says how many exactly.
 264    FIRST is the index of the element with the highest priority; i.e. the
 265    last one in the ready list, since elements are ordered by ascending
 266    priority.
 267    N_READY determines how many insns are on the ready list.  */
 268
 269 struct ready_list
 270 {
 271   rtx *vec;
 272   int veclen;
 273   int first;
 274   int n_ready;
 275 };
 276
 277 static int may_trap_exp (rtx, int);
 278
 279 /* Nonzero iff the address is comprised from at most 1 register.  */
 280 #define CONST_BASED_ADDRESS_P(x)                        \
 281   (REG_P (x)                                    \
 282    || ((GET_CODE (x) == PLUS || GET_CODE (x) == MINUS   \
 283         || (GET_CODE (x) == LO_SUM))                    \
 284        && (CONSTANT_P (XEXP (x, 0))                     \
 285            || CONSTANT_P (XEXP (x, 1)))))
 286
 287 /* Returns a class that insn with GET_DEST(insn)=x may belong to,
 288    as found by analyzing insn's expression.  */
 289
 290 static int
 291 may_trap_exp (rtx x, int is_store)
 292 {
 293   enum rtx_code code;
 294
 295   if (x == 0)
 296     return TRAP_FREE;
 297   code = GET_CODE (x);
 298   if (is_store)
 299     {
 300       if (code == MEM && may_trap_p (x))
 301         return TRAP_RISKY;
 302       else
 303         return TRAP_FREE;
 304     }
 305   if (code == MEM)
 306     {
 307       /* The insn uses memory:  a volatile load.  */
 308       if (MEM_VOLATILE_P (x))
 309         return IRISKY;
 310       /* An exception-free load.  */
 311       if (!may_trap_p (x))
 312         return IFREE;
 313       /* A load with 1 base register, to be further checked.  */
 314       if (CONST_BASED_ADDRESS_P (XEXP (x, 0)))
 315         return PFREE_CANDIDATE;
 316       /* No info on the load, to be further checked.  */
 317       return PRISKY_CANDIDATE;
 318     }
 319   else
 320     {
 321       const char *fmt;
 322       int i, insn_class = TRAP_FREE;
 323
 324       /* Neither store nor load, check if it may cause a trap.  */
 325       if (may_trap_p (x))
 326         return TRAP_RISKY;
 327       /* Recursive step: walk the insn...  */
 328       fmt = GET_RTX_FORMAT (code);
 329       for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
 330         {
 331           if (fmt[i] == 'e')
 332             {
 333               int tmp_class = may_trap_exp (XEXP (x, i), is_store);
 334               insn_class = WORST_CLASS (insn_class, tmp_class);
 335             }
 336           else if (fmt[i] == 'E')
 337             {
 338               int j;
 339               for (j = 0; j < XVECLEN (x, i); j++)
 340                 {
 341                   int tmp_class = may_trap_exp (XVECEXP (x, i, j), is_store);
 342                   insn_class = WORST_CLASS (insn_class, tmp_class);
 343                   if (insn_class == TRAP_RISKY || insn_class == IRISKY)
 344                     break;
 345                 }
 346             }
 347           if (insn_class == TRAP_RISKY || insn_class == IRISKY)
 348             break;
 349         }
 350       return insn_class;
 351     }
 352 }
 353
 354 /* Classifies insn for the purpose of verifying that it can be
 355    moved speculatively, by examining it's patterns, returning:
 356    TRAP_RISKY: store, or risky non-load insn (e.g. division by variable).
 357    TRAP_FREE: non-load insn.
 358    IFREE: load from a globally safe location.
 359    IRISKY: volatile load.
 360    PFREE_CANDIDATE, PRISKY_CANDIDATE: load that need to be checked for
 361    being either PFREE or PRISKY.  */
 362
 363 int
 364 haifa_classify_insn (rtx insn)
 365 {
 366   rtx pat = PATTERN (insn);
 367   int tmp_class = TRAP_FREE;
 368   int insn_class = TRAP_FREE;
 369   enum rtx_code code;
 370
 371   if (GET_CODE (pat) == PARALLEL)
 372     {
 373       int i, len = XVECLEN (pat, 0);
 374
 375       for (i = len - 1; i >= 0; i--)
 376         {
 377           code = GET_CODE (XVECEXP (pat, 0, i));
 378           switch (code)
 379             {
 380             case CLOBBER:
 381               /* Test if it is a 'store'.  */
 382               tmp_class = may_trap_exp (XEXP (XVECEXP (pat, 0, i), 0), 1);
 383               break;
 384             case SET:
 385               /* Test if it is a store.  */
 386               tmp_class = may_trap_exp (SET_DEST (XVECEXP (pat, 0, i)), 1);
 387               if (tmp_class == TRAP_RISKY)
 388                 break;
 389               /* Test if it is a load.  */
 390               tmp_class
 391                 = WORST_CLASS (tmp_class,
 392                                may_trap_exp (SET_SRC (XVECEXP (pat, 0, i)),
 393                                              0));
 394               break;
 395             case COND_EXEC:
 396             case TRAP_IF:
 397               tmp_class = TRAP_RISKY;
 398               break;
 399             default:
 400               ;
 401             }
 402           insn_class = WORST_CLASS (insn_class, tmp_class);
 403           if (insn_class == TRAP_RISKY || insn_class == IRISKY)
 404             break;
 405         }
 406     }
 407   else
 408     {
 409       code = GET_CODE (pat);
 410       switch (code)
 411         {
 412         case CLOBBER:
 413           /* Test if it is a 'store'.  */
 414           tmp_class = may_trap_exp (XEXP (pat, 0), 1);
 415           break;
 416         case SET:
 417           /* Test if it is a store.  */
 418           tmp_class = may_trap_exp (SET_DEST (pat), 1);
 419           if (tmp_class == TRAP_RISKY)
 420             break;
 421           /* Test if it is a load.  */
 422           tmp_class =
 423             WORST_CLASS (tmp_class,
 424                          may_trap_exp (SET_SRC (pat), 0));
 425           break;
 426         case COND_EXEC:
 427         case TRAP_IF:
 428           tmp_class = TRAP_RISKY;
 429           break;
 430         default:;
 431         }
 432       insn_class = tmp_class;
 433     }
 434
 435   return insn_class;
 436 }
 437
 438 /* Forward declarations.  */
 439
 440 static int priority (rtx);
 441 static int rank_for_schedule (const void *, const void *);
 442 static void swap_sort (rtx *, int);
 443 static void queue_insn (rtx, int);
 444 static int schedule_insn (rtx, struct ready_list *, int);
 445 static int find_set_reg_weight (rtx);
 446 static void find_insn_reg_weight (int);
 447 static void adjust_priority (rtx);
 448 static void advance_one_cycle (void);
 449
 450 /* Notes handling mechanism:
 451    =========================
 452    Generally, NOTES are saved before scheduling and restored after scheduling.
 453    The scheduler distinguishes between three types of notes:
 454
 455    (1) LINE_NUMBER notes, generated and used for debugging.  Here,
 456    before scheduling a region, a pointer to the LINE_NUMBER note is
 457    added to the insn following it (in save_line_notes()), and the note
 458    is removed (in rm_line_notes() and unlink_line_notes()).  After
 459    scheduling the region, this pointer is used for regeneration of
 460    the LINE_NUMBER note (in restore_line_notes()).
 461
 462    (2) LOOP_BEGIN, LOOP_END, SETJMP, EHREGION_BEG, EHREGION_END notes:
 463    Before scheduling a region, a pointer to the note is added to the insn
 464    that follows or precedes it.  (This happens as part of the data dependence
 465    computation).  After scheduling an insn, the pointer contained in it is
 466    used for regenerating the corresponding note (in reemit_notes).
 467
 468    (3) All other notes (e.g. INSN_DELETED):  Before scheduling a block,
 469    these notes are put in a list (in rm_other_notes() and
 470    unlink_other_notes ()).  After scheduling the block, these notes are
 471    inserted at the beginning of the block (in schedule_block()).  */
 472
 473 static rtx unlink_other_notes (rtx, rtx);
 474 static rtx unlink_line_notes (rtx, rtx);
 475 static rtx reemit_notes (rtx, rtx);
 476
 477 static rtx *ready_lastpos (struct ready_list *);
 478 static void ready_sort (struct ready_list *);
 479 static rtx ready_remove_first (struct ready_list *);
 480
 481 static void queue_to_ready (struct ready_list *);
 482 static int early_queue_to_ready (state_t, struct ready_list *);
 483
 484 static void debug_ready_list (struct ready_list *);
 485
 486 static rtx move_insn1 (rtx, rtx);
 487 static rtx move_insn (rtx, rtx);
 488
 489 /* The following functions are used to implement multi-pass scheduling
 490    on the first cycle.  */
 491 static rtx ready_element (struct ready_list *, int);
 492 static rtx ready_remove (struct ready_list *, int);
 493 static int max_issue (struct ready_list *, int *);
 494
 495 static rtx choose_ready (struct ready_list *);
 496
 497 #endif /* INSN_SCHEDULING */
 498 \f
 499 /* Point to state used for the current scheduling pass.  */
 500 struct sched_info *current_sched_info;
 501 \f
 502 #ifndef INSN_SCHEDULING
 503 void
 504 schedule_insns (FILE *dump_file ATTRIBUTE_UNUSED)
 505 {
 506 }
 507 #else
 508
 509 /* Pointer to the last instruction scheduled.  Used by rank_for_schedule,
 510    so that insns independent of the last scheduled insn will be preferred
 511    over dependent instructions.  */
 512
 513 static rtx last_scheduled_insn;
 514
 515 /* Compute cost of executing INSN given the dependence LINK on the insn USED.
 516    This is the number of cycles between instruction issue and
 517    instruction results.  */
 518
 519 HAIFA_INLINE int
 520 insn_cost (rtx insn, rtx link, rtx used)
 521 {
 522   int cost = INSN_COST (insn);
 523
 524   if (cost < 0)
 525     {
 526       /* A USE insn, or something else we don't need to
 527          understand.  We can't pass these directly to
 528          result_ready_cost or insn_default_latency because it will
 529          trigger a fatal error for unrecognizable insns.  */
 530       if (recog_memoized (insn) < 0)
 531         {
 532           INSN_COST (insn) = 0;
 533           return 0;
 534         }
 535       else
 536         {
 537           cost = insn_default_latency (insn);
 538           if (cost < 0)
 539             cost = 0;
 540
 541           INSN_COST (insn) = cost;
 542         }
 543     }
 544
 545   /* In this case estimate cost without caring how insn is used.  */
 546   if (link == 0 || used == 0)
 547     return cost;
 548
 549   /* A USE insn should never require the value used to be computed.
 550      This allows the computation of a function's result and parameter
 551      values to overlap the return and call.  */
 552   if (recog_memoized (used) < 0)
 553     cost = 0;
 554   else
 555     {
 556       if (INSN_CODE (insn) >= 0)
 557         {
 558           if (REG_NOTE_KIND (link) == REG_DEP_ANTI)
 559             cost = 0;
 560           else if (REG_NOTE_KIND (link) == REG_DEP_OUTPUT)
 561             {
 562               cost = (insn_default_latency (insn)
 563                       - insn_default_latency (used));
 564               if (cost <= 0)
 565                 cost = 1;
 566             }
 567           else if (bypass_p (insn))
 568             cost = insn_latency (insn, used);
 569         }
 570
 571       if (targetm.sched.adjust_cost)
 572         cost = targetm.sched.adjust_cost (used, link, insn, cost);
 573
 574       if (cost < 0)
 575         cost = 0;
 576     }
 577
 578   return cost;
 579 }
 580
 581 /* Compute the priority number for INSN.  */
 582
 583 static int
 584 priority (rtx insn)
 585 {
 586   rtx link;
 587
 588   if (! INSN_P (insn))
 589     return 0;
 590
 591   if (! INSN_PRIORITY_KNOWN (insn))
 592     {
 593       int this_priority = 0;
 594
 595       if (INSN_DEPEND (insn) == 0)
 596         this_priority = insn_cost (insn, 0, 0);
 597       else
 598         {
 599           for (link = INSN_DEPEND (insn); link; link = XEXP (link, 1))
 600             {
 601               rtx next;
 602               int next_priority;
 603
 604               next = XEXP (link, 0);
 605
 606               /* Critical path is meaningful in block boundaries only.  */
 607               if (! (*current_sched_info->contributes_to_priority) (next, insn))
 608                 continue;
 609
 610               next_priority = insn_cost (insn, link, next) + priority (next);
 611               if (next_priority > this_priority)
 612                 this_priority = next_priority;
 613             }
 614         }
 615       INSN_PRIORITY (insn) = this_priority;
 616       INSN_PRIORITY_KNOWN (insn) = 1;
 617     }
 618
 619   return INSN_PRIORITY (insn);
 620 }
 621 \f
 622 /* Macros and functions for keeping the priority queue sorted, and
 623    dealing with queuing and dequeuing of instructions.  */
 624
 625 #define SCHED_SORT(READY, N_READY)                                   \
 626 do { if ((N_READY) == 2)                                             \
 627        swap_sort (READY, N_READY);                                   \
 628      else if ((N_READY) > 2)                                         \
 629          qsort (READY, N_READY, sizeof (rtx), rank_for_schedule); }  \
 630 while (0)
 631
 632 /* Returns a positive value if x is preferred; returns a negative value if
 633    y is preferred.  Should never return 0, since that will make the sort
 634    unstable.  */
 635
 636 static int
 637 rank_for_schedule (const void *x, const void *y)
 638 {
 639   rtx tmp = *(const rtx *) y;
 640   rtx tmp2 = *(const rtx *) x;
 641   rtx link;
 642   int tmp_class, tmp2_class, depend_count1, depend_count2;
 643   int val, priority_val, weight_val, info_val;
 644
 645   /* The insn in a schedule group should be issued the first.  */
 646   if (SCHED_GROUP_P (tmp) != SCHED_GROUP_P (tmp2))
 647     return SCHED_GROUP_P (tmp2) ? 1 : -1;
 648
 649   /* Prefer insn with higher priority.  */
 650   priority_val = INSN_PRIORITY (tmp2) - INSN_PRIORITY (tmp);
 651
 652   if (priority_val)
 653     return priority_val;
 654
 655   /* Prefer an insn with smaller contribution to registers-pressure.  */
 656   if (!reload_completed &&
 657       (weight_val = INSN_REG_WEIGHT (tmp) - INSN_REG_WEIGHT (tmp2)))
 658     return weight_val;
 659
 660   info_val = (*current_sched_info->rank) (tmp, tmp2);
 661   if (info_val)
 662     return info_val;
 663
 664   /* Compare insns based on their relation to the last-scheduled-insn.  */
 665   if (last_scheduled_insn)
 666     {
 667       /* Classify the instructions into three classes:
 668          1) Data dependent on last schedule insn.
 669          2) Anti/Output dependent on last scheduled insn.
 670          3) Independent of last scheduled insn, or has latency of one.
 671          Choose the insn from the highest numbered class if different.  */
 672       link = find_insn_list (tmp, INSN_DEPEND (last_scheduled_insn));
 673       if (link == 0 || insn_cost (last_scheduled_insn, link, tmp) == 1)
 674         tmp_class = 3;
 675       else if (REG_NOTE_KIND (link) == 0)       /* Data dependence.  */
 676         tmp_class = 1;
 677       else
 678         tmp_class = 2;
 679
 680       link = find_insn_list (tmp2, INSN_DEPEND (last_scheduled_insn));
 681       if (link == 0 || insn_cost (last_scheduled_insn, link, tmp2) == 1)
 682         tmp2_class = 3;
 683       else if (REG_NOTE_KIND (link) == 0)       /* Data dependence.  */
 684         tmp2_class = 1;
 685       else
 686         tmp2_class = 2;
 687
 688       if ((val = tmp2_class - tmp_class))
 689         return val;
 690     }
 691
 692   /* Prefer the insn which has more later insns that depend on it.
 693      This gives the scheduler more freedom when scheduling later
 694      instructions at the expense of added register pressure.  */
 695   depend_count1 = 0;
 696   for (link = INSN_DEPEND (tmp); link; link = XEXP (link, 1))
 697     depend_count1++;
 698
 699   depend_count2 = 0;
 700   for (link = INSN_DEPEND (tmp2); link; link = XEXP (link, 1))
 701     depend_count2++;
 702
 703   val = depend_count2 - depend_count1;
 704   if (val)
 705     return val;
 706
 707   /* If insns are equally good, sort by INSN_LUID (original insn order),
 708      so that we make the sort stable.  This minimizes instruction movement,
 709      thus minimizing sched's effect on debugging and cross-jumping.  */
 710   return INSN_LUID (tmp) - INSN_LUID (tmp2);
 711 }
 712
 713 /* Resort the array A in which only element at index N may be out of order.  */
 714
 715 HAIFA_INLINE static void
 716 swap_sort (rtx *a, int n)
 717 {
 718   rtx insn = a[n - 1];
 719   int i = n - 2;
 720
 721   while (i >= 0 && rank_for_schedule (a + i, &insn) >= 0)
 722     {
 723       a[i + 1] = a[i];
 724       i -= 1;
 725     }
 726   a[i + 1] = insn;
 727 }
 728
 729 /* Add INSN to the insn queue so that it can be executed at least
 730    N_CYCLES after the currently executing insn.  Preserve insns
 731    chain for debugging purposes.  */
 732
 733 HAIFA_INLINE static void
 734 queue_insn (rtx insn, int n_cycles)
 735 {
 736   int next_q = NEXT_Q_AFTER (q_ptr, n_cycles);
 737   rtx link = alloc_INSN_LIST (insn, insn_queue[next_q]);
 738   insn_queue[next_q] = link;
 739   q_size += 1;
 740
 741   if (sched_verbose >= 2)
 742     {
 743       fprintf (sched_dump, ";;\t\tReady-->Q: insn %s: ",
 744                (*current_sched_info->print_insn) (insn, 0));
 745
 746       fprintf (sched_dump, "queued for %d cycles.\n", n_cycles);
 747     }
 748 }
 749
 750 /* Return a pointer to the bottom of the ready list, i.e. the insn
 751    with the lowest priority.  */
 752
 753 HAIFA_INLINE static rtx *
 754 ready_lastpos (struct ready_list *ready)
 755 {
 756   if (ready->n_ready == 0)
 757     abort ();
 758   return ready->vec + ready->first - ready->n_ready + 1;
 759 }
 760
 761 /* Add an element INSN to the ready list so that it ends up with the lowest
 762    priority.  */
 763
 764 HAIFA_INLINE void
 765 ready_add (struct ready_list *ready, rtx insn)
 766 {
 767   if (ready->first == ready->n_ready)
 768     {
 769       memmove (ready->vec + ready->veclen - ready->n_ready,
 770                ready_lastpos (ready),
 771                ready->n_ready * sizeof (rtx));
 772       ready->first = ready->veclen - 1;
 773     }
 774   ready->vec[ready->first - ready->n_ready] = insn;
 775   ready->n_ready++;
 776 }
 777
 778 /* Remove the element with the highest priority from the ready list and
 779    return it.  */
 780
 781 HAIFA_INLINE static rtx
 782 ready_remove_first (struct ready_list *ready)
 783 {
 784   rtx t;
 785   if (ready->n_ready == 0)
 786     abort ();
 787   t = ready->vec[ready->first--];
 788   ready->n_ready--;
 789   /* If the queue becomes empty, reset it.  */
 790   if (ready->n_ready == 0)
 791     ready->first = ready->veclen - 1;
 792   return t;
 793 }
 794
 795 /* The following code implements multi-pass scheduling for the first
 796    cycle.  In other words, we will try to choose ready insn which
 797    permits to start maximum number of insns on the same cycle.  */
 798
 799 /* Return a pointer to the element INDEX from the ready.  INDEX for
 800    insn with the highest priority is 0, and the lowest priority has
 801    N_READY - 1.  */
 802
 803 HAIFA_INLINE static rtx
 804 ready_element (struct ready_list *ready, int index)
 805 {
 806 #ifdef ENABLE_CHECKING
 807   if (ready->n_ready == 0 || index >= ready->n_ready)
 808     abort ();
 809 #endif
 810   return ready->vec[ready->first - index];
 811 }
 812
 813 /* Remove the element INDEX from the ready list and return it.  INDEX
 814    for insn with the highest priority is 0, and the lowest priority
 815    has N_READY - 1.  */
 816
 817 HAIFA_INLINE static rtx
 818 ready_remove (struct ready_list *ready, int index)
 819 {
 820   rtx t;
 821   int i;
 822
 823   if (index == 0)
 824     return ready_remove_first (ready);
 825   if (ready->n_ready == 0 || index >= ready->n_ready)
 826     abort ();
 827   t = ready->vec[ready->first - index];
 828   ready->n_ready--;
 829   for (i = index; i < ready->n_ready; i++)
 830     ready->vec[ready->first - i] = ready->vec[ready->first - i - 1];
 831   return t;
 832 }
 833
 834
 835 /* Sort the ready list READY by ascending priority, using the SCHED_SORT
 836    macro.  */
 837
 838 HAIFA_INLINE static void
 839 ready_sort (struct ready_list *ready)
 840 {
 841   rtx *first = ready_lastpos (ready);
 842   SCHED_SORT (first, ready->n_ready);
 843 }
 844
 845 /* PREV is an insn that is ready to execute.  Adjust its priority if that
 846    will help shorten or lengthen register lifetimes as appropriate.  Also
 847    provide a hook for the target to tweek itself.  */
 848
 849 HAIFA_INLINE static void
 850 adjust_priority (rtx prev)
 851 {
 852   /* ??? There used to be code here to try and estimate how an insn
 853      affected register lifetimes, but it did it by looking at REG_DEAD
 854      notes, which we removed in schedule_region.  Nor did it try to
 855      take into account register pressure or anything useful like that.
 856
 857      Revisit when we have a machine model to work with and not before.  */
 858
 859   if (targetm.sched.adjust_priority)
 860     INSN_PRIORITY (prev) =
 861       targetm.sched.adjust_priority (prev, INSN_PRIORITY (prev));
 862 }
 863
 864 /* Advance time on one cycle.  */
 865 HAIFA_INLINE static void
 866 advance_one_cycle (void)
 867 {
 868   if (targetm.sched.dfa_pre_cycle_insn)
 869     state_transition (curr_state,
 870                       targetm.sched.dfa_pre_cycle_insn ());
 871
 872   state_transition (curr_state, NULL);
 873
 874   if (targetm.sched.dfa_post_cycle_insn)
 875     state_transition (curr_state,
 876                       targetm.sched.dfa_post_cycle_insn ());
 877 }
 878
 879 /* Clock at which the previous instruction was issued.  */
 880 static int last_clock_var;
 881
 882 /* INSN is the "currently executing insn".  Launch each insn which was
 883    waiting on INSN.  READY is the ready list which contains the insns
 884    that are ready to fire.  CLOCK is the current cycle.  The function
 885    returns necessary cycle advance after issuing the insn (it is not
 886    zero for insns in a schedule group).  */
 887
 888 static int
 889 schedule_insn (rtx insn, struct ready_list *ready, int clock)
 890 {
 891   rtx link;
 892   int advance = 0;
 893   int premature_issue = 0;
 894
 895   if (sched_verbose >= 1)
 896     {
 897       char buf[2048];
 898
 899       print_insn (buf, insn, 0);
 900       buf[40] = 0;
 901       fprintf (sched_dump, ";;\t%3i--> %-40s:", clock, buf);
 902
 903       if (recog_memoized (insn) < 0)
 904         fprintf (sched_dump, "nothing");
 905       else
 906         print_reservation (sched_dump, insn);
 907       fputc ('\n', sched_dump);
 908     }
 909
 910   if (INSN_TICK (insn) > clock)
 911     {
 912       /* 'insn' has been prematurely moved from the queue to the
 913          ready list.  */
 914       premature_issue = INSN_TICK (insn) - clock;
 915     }
 916
 917   for (link = INSN_DEPEND (insn); link != 0; link = XEXP (link, 1))
 918     {
 919       rtx next = XEXP (link, 0);
 920       int cost = insn_cost (insn, link, next);
 921
 922       INSN_TICK (next) = MAX (INSN_TICK (next), clock + cost + premature_issue);
 923
 924       if ((INSN_DEP_COUNT (next) -= 1) == 0)
 925         {
 926           int effective_cost = INSN_TICK (next) - clock;
 927
 928           if (! (*current_sched_info->new_ready) (next))
 929             continue;
 930
 931           if (sched_verbose >= 2)
 932             {
 933               fprintf (sched_dump, ";;\t\tdependences resolved: insn %s ",
 934                        (*current_sched_info->print_insn) (next, 0));
 935
 936               if (effective_cost < 1)
 937                 fprintf (sched_dump, "into ready\n");
 938               else
 939                 fprintf (sched_dump, "into queue with cost=%d\n",
 940                          effective_cost);
 941             }
 942
 943           /* Adjust the priority of NEXT and either put it on the ready
 944              list or queue it.  */
 945           adjust_priority (next);
 946           if (effective_cost < 1)
 947             ready_add (ready, next);
 948           else
 949             {
 950               queue_insn (next, effective_cost);
 951
 952               if (SCHED_GROUP_P (next) && advance < effective_cost)
 953                 advance = effective_cost;
 954             }
 955         }
 956     }
 957
 958   /* Annotate the instruction with issue information -- TImode
 959      indicates that the instruction is expected not to be able
 960      to issue on the same cycle as the previous insn.  A machine
 961      may use this information to decide how the instruction should
 962      be aligned.  */
 963   if (issue_rate > 1
 964       && GET_CODE (PATTERN (insn)) != USE
 965       && GET_CODE (PATTERN (insn)) != CLOBBER)
 966     {
 967       if (reload_completed)
 968         PUT_MODE (insn, clock > last_clock_var ? TImode : VOIDmode);
 969       last_clock_var = clock;
 970     }
 971   return advance;
 972 }
 973
 974 /* Functions for handling of notes.  */
 975
 976 /* Delete notes beginning with INSN and put them in the chain
 977    of notes ended by NOTE_LIST.
 978    Returns the insn following the notes.  */
 979
 980 static rtx
 981 unlink_other_notes (rtx insn, rtx tail)
 982 {
 983   rtx prev = PREV_INSN (insn);
 984
 985   while (insn != tail && NOTE_P (insn))
 986     {
 987       rtx next = NEXT_INSN (insn);
 988       /* Delete the note from its current position.  */
 989       if (prev)
 990         NEXT_INSN (prev) = next;
 991       if (next)
 992         PREV_INSN (next) = prev;
 993
 994       /* See sched_analyze to see how these are handled.  */
 995       if (NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG
 996           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_END
 997           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_BASIC_BLOCK
 998           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_EH_REGION_BEG
 999           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_EH_REGION_END)
1000         {
1001           /* Insert the note at the end of the notes list.  */
1002           PREV_INSN (insn) = note_list;
1003           if (note_list)
1004             NEXT_INSN (note_list) = insn;
1005           note_list = insn;
1006         }
1007
1008       insn = next;
1009     }
1010   return insn;
1011 }
1012
1013 /* Delete line notes beginning with INSN. Record line-number notes so
1014    they can be reused.  Returns the insn following the notes.  */
1015
1016 static rtx
1017 unlink_line_notes (rtx insn, rtx tail)
1018 {
1019   rtx prev = PREV_INSN (insn);
1020
1021   while (insn != tail && NOTE_P (insn))
1022     {
1023       rtx next = NEXT_INSN (insn);
1024
1025       if (write_symbols != NO_DEBUG && NOTE_LINE_NUMBER (insn) > 0)
1026         {
1027           /* Delete the note from its current position.  */
1028           if (prev)
1029             NEXT_INSN (prev) = next;
1030           if (next)
1031             PREV_INSN (next) = prev;
1032
1033           /* Record line-number notes so they can be reused.  */
1034           LINE_NOTE (insn) = insn;
1035         }
1036       else
1037         prev = insn;
1038
1039       insn = next;
1040     }
1041   return insn;
1042 }
1043
1044 /* Return the head and tail pointers of BB.  */
1045
1046 void
1047 get_block_head_tail (int b, rtx *headp, rtx *tailp)
1048 {
1049   /* HEAD and TAIL delimit the basic block being scheduled.  */
1050   rtx head = BB_HEAD (BASIC_BLOCK (b));
1051   rtx tail = BB_END (BASIC_BLOCK (b));
1052
1053   /* Don't include any notes or labels at the beginning of the
1054      basic block, or notes at the ends of basic blocks.  */
1055   while (head != tail)
1056     {
1057       if (NOTE_P (head))
1058         head = NEXT_INSN (head);
1059       else if (NOTE_P (tail))
1060         tail = PREV_INSN (tail);
1061       else if (LABEL_P (head))
1062         head = NEXT_INSN (head);
1063       else
1064         break;
1065     }
1066
1067   *headp = head;
1068   *tailp = tail;
1069 }
1070
1071 /* Return nonzero if there are no real insns in the range [ HEAD, TAIL ].  */
1072
1073 int
1074 no_real_insns_p (rtx head, rtx tail)
1075 {
1076   while (head != NEXT_INSN (tail))
1077     {
1078       if (!NOTE_P (head) && !LABEL_P (head))
1079         return 0;
1080       head = NEXT_INSN (head);
1081     }
1082   return 1;
1083 }
1084
1085 /* Delete line notes from one block. Save them so they can be later restored
1086    (in restore_line_notes).  HEAD and TAIL are the boundaries of the
1087    block in which notes should be processed.  */
1088
1089 void
1090 rm_line_notes (rtx head, rtx tail)
1091 {
1092   rtx next_tail;
1093   rtx insn;
1094
1095   next_tail = NEXT_INSN (tail);
1096   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1097     {
1098       rtx prev;
1099
1100       /* Farm out notes, and maybe save them in NOTE_LIST.
1101          This is needed to keep the debugger from
1102          getting completely deranged.  */
1103       if (NOTE_P (insn))
1104         {
1105           prev = insn;
1106           insn = unlink_line_notes (insn, next_tail);
1107
1108           if (prev == tail)
1109             abort ();
1110           if (prev == head)
1111             abort ();
1112           if (insn == next_tail)
1113             abort ();
1114         }
1115     }
1116 }
1117
1118 /* Save line number notes for each insn in block B.  HEAD and TAIL are
1119    the boundaries of the block in which notes should be processed.  */
1120
1121 void
1122 save_line_notes (int b, rtx head, rtx tail)
1123 {
1124   rtx next_tail;
1125
1126   /* We must use the true line number for the first insn in the block
1127      that was computed and saved at the start of this pass.  We can't
1128      use the current line number, because scheduling of the previous
1129      block may have changed the current line number.  */
1130
1131   rtx line = line_note_head[b];
1132   rtx insn;
1133
1134   next_tail = NEXT_INSN (tail);
1135
1136   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1137     if (NOTE_P (insn) && NOTE_LINE_NUMBER (insn) > 0)
1138       line = insn;
1139     else
1140       LINE_NOTE (insn) = line;
1141 }
1142
1143 /* After a block was scheduled, insert line notes into the insns list.
1144    HEAD and TAIL are the boundaries of the block in which notes should
1145    be processed.  */
1146
1147 void
1148 restore_line_notes (rtx head, rtx tail)
1149 {
1150   rtx line, note, prev, new;
1151   int added_notes = 0;
1152   rtx next_tail, insn;
1153
1154   head = head;
1155   next_tail = NEXT_INSN (tail);
1156
1157   /* Determine the current line-number.  We want to know the current
1158      line number of the first insn of the block here, in case it is
1159      different from the true line number that was saved earlier.  If
1160      different, then we need a line number note before the first insn
1161      of this block.  If it happens to be the same, then we don't want to
1162      emit another line number note here.  */
1163   for (line = head; line; line = PREV_INSN (line))
1164     if (NOTE_P (line) && NOTE_LINE_NUMBER (line) > 0)
1165       break;
1166
1167   /* Walk the insns keeping track of the current line-number and inserting
1168      the line-number notes as needed.  */
1169   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1170     if (NOTE_P (insn) && NOTE_LINE_NUMBER (insn) > 0)
1171       line = insn;
1172   /* This used to emit line number notes before every non-deleted note.
1173      However, this confuses a debugger, because line notes not separated
1174      by real instructions all end up at the same address.  I can find no
1175      use for line number notes before other notes, so none are emitted.  */
1176     else if (!NOTE_P (insn)
1177              && INSN_UID (insn) < old_max_uid
1178              && (note = LINE_NOTE (insn)) != 0
1179              && note != line
1180              && (line == 0
1181 #ifdef USE_MAPPED_LOCATION
1182                  || NOTE_SOURCE_LOCATION (note) != NOTE_SOURCE_LOCATION (line)
1183 #else
1184                  || NOTE_LINE_NUMBER (note) != NOTE_LINE_NUMBER (line)
1185                  || NOTE_SOURCE_FILE (note) != NOTE_SOURCE_FILE (line)
1186 #endif
1187                  ))
1188       {
1189         line = note;
1190         prev = PREV_INSN (insn);
1191         if (LINE_NOTE (note))
1192           {
1193             /* Re-use the original line-number note.  */
1194             LINE_NOTE (note) = 0;
1195             PREV_INSN (note) = prev;
1196             NEXT_INSN (prev) = note;
1197             PREV_INSN (insn) = note;
1198             NEXT_INSN (note) = insn;
1199           }
1200         else
1201           {
1202             added_notes++;
1203             new = emit_note_after (NOTE_LINE_NUMBER (note), prev);
1204 #ifndef USE_MAPPED_LOCATION
1205             NOTE_SOURCE_FILE (new) = NOTE_SOURCE_FILE (note);
1206 #endif
1207           }
1208       }
1209   if (sched_verbose && added_notes)
1210     fprintf (sched_dump, ";; added %d line-number notes\n", added_notes);
1211 }
1212
1213 /* After scheduling the function, delete redundant line notes from the
1214    insns list.  */
1215
1216 void
1217 rm_redundant_line_notes (void)
1218 {
1219   rtx line = 0;
1220   rtx insn = get_insns ();
1221   int active_insn = 0;
1222   int notes = 0;
1223
1224   /* Walk the insns deleting redundant line-number notes.  Many of these
1225      are already present.  The remainder tend to occur at basic
1226      block boundaries.  */
1227   for (insn = get_last_insn (); insn; insn = PREV_INSN (insn))
1228     if (NOTE_P (insn) && NOTE_LINE_NUMBER (insn) > 0)
1229       {
1230         /* If there are no active insns following, INSN is redundant.  */
1231         if (active_insn == 0)
1232           {
1233             notes++;
1234             SET_INSN_DELETED (insn);
1235           }
1236         /* If the line number is unchanged, LINE is redundant.  */
1237         else if (line
1238 #ifdef USE_MAPPED_LOCATION
1239                  && NOTE_SOURCE_LOCATION (line) == NOTE_SOURCE_LOCATION (insn)
1240 #else
1241                  && NOTE_LINE_NUMBER (line) == NOTE_LINE_NUMBER (insn)
1242                  && NOTE_SOURCE_FILE (line) == NOTE_SOURCE_FILE (insn)
1243 #endif
1244 )
1245           {
1246             notes++;
1247             SET_INSN_DELETED (line);
1248             line = insn;
1249           }
1250         else
1251           line = insn;
1252         active_insn = 0;
1253       }
1254     else if (!((NOTE_P (insn)
1255                 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_DELETED)
1256                || (NONJUMP_INSN_P (insn)
1257                    && (GET_CODE (PATTERN (insn)) == USE
1258                        || GET_CODE (PATTERN (insn)) == CLOBBER))))
1259       active_insn++;
1260
1261   if (sched_verbose && notes)
1262     fprintf (sched_dump, ";; deleted %d line-number notes\n", notes);
1263 }
1264
1265 /* Delete notes between HEAD and TAIL and put them in the chain
1266    of notes ended by NOTE_LIST.  */
1267
1268 void
1269 rm_other_notes (rtx head, rtx tail)
1270 {
1271   rtx next_tail;
1272   rtx insn;
1273
1274   note_list = 0;
1275   if (head == tail && (! INSN_P (head)))
1276     return;
1277
1278   next_tail = NEXT_INSN (tail);
1279   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1280     {
1281       rtx prev;
1282
1283       /* Farm out notes, and maybe save them in NOTE_LIST.
1284          This is needed to keep the debugger from
1285          getting completely deranged.  */
1286       if (NOTE_P (insn))
1287         {
1288           prev = insn;
1289
1290           insn = unlink_other_notes (insn, next_tail);
1291
1292           if (prev == tail)
1293             abort ();
1294           if (prev == head)
1295             abort ();
1296           if (insn == next_tail)
1297             abort ();
1298         }
1299     }
1300 }
1301
1302 /* Functions for computation of registers live/usage info.  */
1303
1304 /* This function looks for a new register being defined.
1305    If the destination register is already used by the source,
1306    a new register is not needed.  */
1307
1308 static int
1309 find_set_reg_weight (rtx x)
1310 {
1311   if (GET_CODE (x) == CLOBBER
1312       && register_operand (SET_DEST (x), VOIDmode))
1313     return 1;
1314   if (GET_CODE (x) == SET
1315       && register_operand (SET_DEST (x), VOIDmode))
1316     {
1317       if (REG_P (SET_DEST (x)))
1318         {
1319           if (!reg_mentioned_p (SET_DEST (x), SET_SRC (x)))
1320             return 1;
1321           else
1322             return 0;
1323         }
1324       return 1;
1325     }
1326   return 0;
1327 }
1328
1329 /* Calculate INSN_REG_WEIGHT for all insns of a block.  */
1330
1331 static void
1332 find_insn_reg_weight (int b)
1333 {
1334   rtx insn, next_tail, head, tail;
1335
1336   get_block_head_tail (b, &head, &tail);
1337   next_tail = NEXT_INSN (tail);
1338
1339   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1340     {
1341       int reg_weight = 0;
1342       rtx x;
1343
1344       /* Handle register life information.  */
1345       if (! INSN_P (insn))
1346         continue;
1347
1348       /* Increment weight for each register born here.  */
1349       x = PATTERN (insn);
1350       reg_weight += find_set_reg_weight (x);
1351       if (GET_CODE (x) == PARALLEL)
1352         {
1353           int j;
1354           for (j = XVECLEN (x, 0) - 1; j >= 0; j--)
1355             {
1356               x = XVECEXP (PATTERN (insn), 0, j);
1357               reg_weight += find_set_reg_weight (x);
1358             }
1359         }
1360       /* Decrement weight for each register that dies here.  */
1361       for (x = REG_NOTES (insn); x; x = XEXP (x, 1))
1362         {
1363           if (REG_NOTE_KIND (x) == REG_DEAD
1364               || REG_NOTE_KIND (x) == REG_UNUSED)
1365             reg_weight--;
1366         }
1367
1368       INSN_REG_WEIGHT (insn) = reg_weight;
1369     }
1370 }
1371
1372 /* Scheduling clock, modified in schedule_block() and queue_to_ready ().  */
1373 static int clock_var;
1374
1375 /* Move insns that became ready to fire from queue to ready list.  */
1376
1377 static void
1378 queue_to_ready (struct ready_list *ready)
1379 {
1380   rtx insn;
1381   rtx link;
1382
1383   q_ptr = NEXT_Q (q_ptr);
1384
1385   /* Add all pending insns that can be scheduled without stalls to the
1386      ready list.  */
1387   for (link = insn_queue[q_ptr]; link; link = XEXP (link, 1))
1388     {
1389       insn = XEXP (link, 0);
1390       q_size -= 1;
1391
1392       if (sched_verbose >= 2)
1393         fprintf (sched_dump, ";;\t\tQ-->Ready: insn %s: ",
1394                  (*current_sched_info->print_insn) (insn, 0));
1395
1396       ready_add (ready, insn);
1397       if (sched_verbose >= 2)
1398         fprintf (sched_dump, "moving to ready without stalls\n");
1399     }
1400   insn_queue[q_ptr] = 0;
1401
1402   /* If there are no ready insns, stall until one is ready and add all
1403      of the pending insns at that point to the ready list.  */
1404   if (ready->n_ready == 0)
1405     {
1406       int stalls;
1407
1408       for (stalls = 1; stalls <= max_insn_queue_index; stalls++)
1409         {
1410           if ((link = insn_queue[NEXT_Q_AFTER (q_ptr, stalls)]))
1411             {
1412               for (; link; link = XEXP (link, 1))
1413                 {
1414                   insn = XEXP (link, 0);
1415                   q_size -= 1;
1416
1417                   if (sched_verbose >= 2)
1418                     fprintf (sched_dump, ";;\t\tQ-->Ready: insn %s: ",
1419                              (*current_sched_info->print_insn) (insn, 0));
1420
1421                   ready_add (ready, insn);
1422                   if (sched_verbose >= 2)
1423                     fprintf (sched_dump, "moving to ready with %d stalls\n", stalls);
1424                 }
1425               insn_queue[NEXT_Q_AFTER (q_ptr, stalls)] = 0;
1426
1427               advance_one_cycle ();
1428
1429               break;
1430             }
1431
1432           advance_one_cycle ();
1433         }
1434
1435       q_ptr = NEXT_Q_AFTER (q_ptr, stalls);
1436       clock_var += stalls;
1437     }
1438 }
1439
1440 /* Used by early_queue_to_ready.  Determines whether it is "ok" to
1441    prematurely move INSN from the queue to the ready list.  Currently,
1442    if a target defines the hook 'is_costly_dependence', this function
1443    uses the hook to check whether there exist any dependences which are
1444    considered costly by the target, between INSN and other insns that
1445    have already been scheduled.  Dependences are checked up to Y cycles
1446    back, with default Y=1; The flag -fsched-stalled-insns-dep=Y allows
1447    controlling this value.
1448    (Other considerations could be taken into account instead (or in
1449    addition) depending on user flags and target hooks.  */
1450
1451 static bool
1452 ok_for_early_queue_removal (rtx insn)
1453 {
1454   int n_cycles;
1455   rtx prev_insn = last_scheduled_insn;
1456
1457   if (targetm.sched.is_costly_dependence)
1458     {
1459       for (n_cycles = flag_sched_stalled_insns_dep; n_cycles; n_cycles--)
1460         {
1461           for ( ; prev_insn; prev_insn = PREV_INSN (prev_insn))
1462             {
1463               rtx dep_link = 0;
1464               int dep_cost;
1465
1466               if (!NOTE_P (prev_insn))
1467                 {
1468                   dep_link = find_insn_list (insn, INSN_DEPEND (prev_insn));
1469                   if (dep_link)
1470                     {
1471                       dep_cost = insn_cost (prev_insn, dep_link, insn) ;
1472                       if (targetm.sched.is_costly_dependence (prev_insn, insn,
1473                                 dep_link, dep_cost,
1474                                 flag_sched_stalled_insns_dep - n_cycles))
1475                         return false;
1476                     }
1477                 }
1478
1479               if (GET_MODE (prev_insn) == TImode) /* end of dispatch group */
1480                 break;
1481             }
1482
1483           if (!prev_insn)
1484             break;
1485           prev_insn = PREV_INSN (prev_insn);
1486         }
1487     }
1488
1489   return true;
1490 }
1491
1492
1493 /* Remove insns from the queue, before they become "ready" with respect
1494    to FU latency considerations.  */
1495
1496 static int
1497 early_queue_to_ready (state_t state, struct ready_list *ready)
1498 {
1499   rtx insn;
1500   rtx link;
1501   rtx next_link;
1502   rtx prev_link;
1503   bool move_to_ready;
1504   int cost;
1505   state_t temp_state = alloca (dfa_state_size);
1506   int stalls;
1507   int insns_removed = 0;
1508
1509   /*
1510      Flag '-fsched-stalled-insns=X' determines the aggressiveness of this
1511      function:
1512
1513      X == 0: There is no limit on how many queued insns can be removed
1514              prematurely.  (flag_sched_stalled_insns = -1).
1515
1516      X >= 1: Only X queued insns can be removed prematurely in each
1517              invocation.  (flag_sched_stalled_insns = X).
1518
1519      Otherwise: Early queue removal is disabled.
1520          (flag_sched_stalled_insns = 0)
1521   */
1522
1523   if (! flag_sched_stalled_insns)
1524     return 0;
1525
1526   for (stalls = 0; stalls <= max_insn_queue_index; stalls++)
1527     {
1528       if ((link = insn_queue[NEXT_Q_AFTER (q_ptr, stalls)]))
1529         {
1530           if (sched_verbose > 6)
1531             fprintf (sched_dump, ";; look at index %d + %d\n", q_ptr, stalls);
1532
1533           prev_link = 0;
1534           while (link)
1535             {
1536               next_link = XEXP (link, 1);
1537               insn = XEXP (link, 0);
1538               if (insn && sched_verbose > 6)
1539                 print_rtl_single (sched_dump, insn);
1540
1541               memcpy (temp_state, state, dfa_state_size);
1542               if (recog_memoized (insn) < 0)
1543                 /* non-negative to indicate that it's not ready
1544                    to avoid infinite Q->R->Q->R... */
1545                 cost = 0;
1546               else
1547                 cost = state_transition (temp_state, insn);
1548
1549               if (sched_verbose >= 6)
1550                 fprintf (sched_dump, "transition cost = %d\n", cost);
1551
1552               move_to_ready = false;
1553               if (cost < 0)
1554                 {
1555                   move_to_ready = ok_for_early_queue_removal (insn);
1556                   if (move_to_ready == true)
1557                     {
1558                       /* move from Q to R */
1559                       q_size -= 1;
1560                       ready_add (ready, insn);
1561
1562                       if (prev_link)
1563                         XEXP (prev_link, 1) = next_link;
1564                       else
1565                         insn_queue[NEXT_Q_AFTER (q_ptr, stalls)] = next_link;
1566
1567                       free_INSN_LIST_node (link);
1568
1569                       if (sched_verbose >= 2)
1570                         fprintf (sched_dump, ";;\t\tEarly Q-->Ready: insn %s\n",
1571                                  (*current_sched_info->print_insn) (insn, 0));
1572
1573                       insns_removed++;
1574                       if (insns_removed == flag_sched_stalled_insns)
1575                         /* Remove only one insn from Q at a time.  */
1576                         return insns_removed;
1577                     }
1578                 }
1579
1580               if (move_to_ready == false)
1581                 prev_link = link;
1582
1583               link = next_link;
1584             } /* while link */
1585         } /* if link */
1586
1587     } /* for stalls.. */
1588
1589   return insns_removed;
1590 }
1591
1592
1593 /* Print the ready list for debugging purposes.  Callable from debugger.  */
1594
1595 static void
1596 debug_ready_list (struct ready_list *ready)
1597 {
1598   rtx *p;
1599   int i;
1600
1601   if (ready->n_ready == 0)
1602     {
1603       fprintf (sched_dump, "\n");
1604       return;
1605     }
1606
1607   p = ready_lastpos (ready);
1608   for (i = 0; i < ready->n_ready; i++)
1609     fprintf (sched_dump, "  %s", (*current_sched_info->print_insn) (p[i], 0));
1610   fprintf (sched_dump, "\n");
1611 }
1612
1613 /* move_insn1: Remove INSN from insn chain, and link it after LAST insn.  */
1614
1615 static rtx
1616 move_insn1 (rtx insn, rtx last)
1617 {
1618   NEXT_INSN (PREV_INSN (insn)) = NEXT_INSN (insn);
1619   PREV_INSN (NEXT_INSN (insn)) = PREV_INSN (insn);
1620
1621   NEXT_INSN (insn) = NEXT_INSN (last);
1622   PREV_INSN (NEXT_INSN (last)) = insn;
1623
1624   NEXT_INSN (last) = insn;
1625   PREV_INSN (insn) = last;
1626
1627   return insn;
1628 }
1629
1630 /* Search INSN for REG_SAVE_NOTE note pairs for
1631    NOTE_INSN_{LOOP,EHREGION}_{BEG,END}; and convert them back into
1632    NOTEs.  The REG_SAVE_NOTE note following first one is contains the
1633    saved value for NOTE_BLOCK_NUMBER which is useful for
1634    NOTE_INSN_EH_REGION_{BEG,END} NOTEs.  LAST is the last instruction
1635    output by the instruction scheduler.  Return the new value of LAST.  */
1636
1637 static rtx
1638 reemit_notes (rtx insn, rtx last)
1639 {
1640   rtx note, retval;
1641
1642   retval = last;
1643   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
1644     {
1645       if (REG_NOTE_KIND (note) == REG_SAVE_NOTE)
1646         {
1647           enum insn_note note_type = INTVAL (XEXP (note, 0));
1648
1649           last = emit_note_before (note_type, last);
1650           remove_note (insn, note);
1651           note = XEXP (note, 1);
1652           if (note_type == NOTE_INSN_EH_REGION_BEG
1653               || note_type == NOTE_INSN_EH_REGION_END)
1654             NOTE_EH_HANDLER (last) = INTVAL (XEXP (note, 0));
1655           remove_note (insn, note);
1656         }
1657     }
1658   return retval;
1659 }
1660
1661 /* Move INSN.  Reemit notes if needed.
1662
1663    Return the last insn emitted by the scheduler, which is the
1664    return value from the first call to reemit_notes.  */
1665
1666 static rtx
1667 move_insn (rtx insn, rtx last)
1668 {
1669   rtx retval = NULL;
1670
1671   move_insn1 (insn, last);
1672
1673   /* If this is the first call to reemit_notes, then record
1674      its return value.  */
1675   if (retval == NULL_RTX)
1676     retval = reemit_notes (insn, insn);
1677   else
1678     reemit_notes (insn, insn);
1679
1680   SCHED_GROUP_P (insn) = 0;
1681
1682   return retval;
1683 }
1684
1685 /* The following structure describe an entry of the stack of choices.  */
1686 struct choice_entry
1687 {
1688   /* Ordinal number of the issued insn in the ready queue.  */
1689   int index;
1690   /* The number of the rest insns whose issues we should try.  */
1691   int rest;
1692   /* The number of issued essential insns.  */
1693   int n;
1694   /* State after issuing the insn.  */
1695   state_t state;
1696 };
1697
1698 /* The following array is used to implement a stack of choices used in
1699    function max_issue.  */
1700 static struct choice_entry *choice_stack;
1701
1702 /* The following variable value is number of essential insns issued on
1703    the current cycle.  An insn is essential one if it changes the
1704    processors state.  */
1705 static int cycle_issued_insns;
1706
1707 /* The following variable value is maximal number of tries of issuing
1708    insns for the first cycle multipass insn scheduling.  We define
1709    this value as constant*(DFA_LOOKAHEAD**ISSUE_RATE).  We would not
1710    need this constraint if all real insns (with non-negative codes)
1711    had reservations because in this case the algorithm complexity is
1712    O(DFA_LOOKAHEAD**ISSUE_RATE).  Unfortunately, the dfa descriptions
1713    might be incomplete and such insn might occur.  For such
1714    descriptions, the complexity of algorithm (without the constraint)
1715    could achieve DFA_LOOKAHEAD ** N , where N is the queue length.  */
1716 static int max_lookahead_tries;
1717
1718 /* The following value is value of hook
1719    `first_cycle_multipass_dfa_lookahead' at the last call of
1720    `max_issue'.  */
1721 static int cached_first_cycle_multipass_dfa_lookahead = 0;
1722
1723 /* The following value is value of `issue_rate' at the last call of
1724    `sched_init'.  */
1725 static int cached_issue_rate = 0;
1726
1727 /* The following function returns maximal (or close to maximal) number
1728    of insns which can be issued on the same cycle and one of which
1729    insns is insns with the best rank (the first insn in READY).  To
1730    make this function tries different samples of ready insns.  READY
1731    is current queue `ready'.  Global array READY_TRY reflects what
1732    insns are already issued in this try.  INDEX will contain index
1733    of the best insn in READY.  The following function is used only for
1734    first cycle multipass scheduling.  */
1735 static int
1736 max_issue (struct ready_list *ready, int *index)
1737 {
1738   int n, i, all, n_ready, best, delay, tries_num;
1739   struct choice_entry *top;
1740   rtx insn;
1741
1742   best = 0;
1743   memcpy (choice_stack->state, curr_state, dfa_state_size);
1744   top = choice_stack;
1745   top->rest = cached_first_cycle_multipass_dfa_lookahead;
1746   top->n = 0;
1747   n_ready = ready->n_ready;
1748   for (all = i = 0; i < n_ready; i++)
1749     if (!ready_try [i])
1750       all++;
1751   i = 0;
1752   tries_num = 0;
1753   for (;;)
1754     {
1755       if (top->rest == 0 || i >= n_ready)
1756         {
1757           if (top == choice_stack)
1758             break;
1759           if (best < top - choice_stack && ready_try [0])
1760             {
1761               best = top - choice_stack;
1762               *index = choice_stack [1].index;
1763               if (top->n == issue_rate - cycle_issued_insns || best == all)
1764                 break;
1765             }
1766           i = top->index;
1767           ready_try [i] = 0;
1768           top--;
1769           memcpy (curr_state, top->state, dfa_state_size);
1770         }
1771       else if (!ready_try [i])
1772         {
1773           tries_num++;
1774           if (tries_num > max_lookahead_tries)
1775             break;
1776           insn = ready_element (ready, i);
1777           delay = state_transition (curr_state, insn);
1778           if (delay < 0)
1779             {
1780               if (state_dead_lock_p (curr_state))
1781                 top->rest = 0;
1782               else
1783                 top->rest--;
1784               n = top->n;
1785               if (memcmp (top->state, curr_state, dfa_state_size) != 0)
1786                 n++;
1787               top++;
1788               top->rest = cached_first_cycle_multipass_dfa_lookahead;
1789               top->index = i;
1790               top->n = n;
1791               memcpy (top->state, curr_state, dfa_state_size);
1792               ready_try [i] = 1;
1793               i = -1;
1794             }
1795         }
1796       i++;
1797     }
1798   while (top != choice_stack)
1799     {
1800       ready_try [top->index] = 0;
1801       top--;
1802     }
1803   memcpy (curr_state, choice_stack->state, dfa_state_size);
1804   return best;
1805 }
1806
1807 /* The following function chooses insn from READY and modifies
1808    *N_READY and READY.  The following function is used only for first
1809    cycle multipass scheduling.  */
1810
1811 static rtx
1812 choose_ready (struct ready_list *ready)
1813 {
1814   int lookahead = 0;
1815
1816   if (targetm.sched.first_cycle_multipass_dfa_lookahead)
1817     lookahead = targetm.sched.first_cycle_multipass_dfa_lookahead ();
1818   if (lookahead <= 0 || SCHED_GROUP_P (ready_element (ready, 0)))
1819     return ready_remove_first (ready);
1820   else
1821     {
1822       /* Try to choose the better insn.  */
1823       int index = 0, i;
1824       rtx insn;
1825
1826       if (cached_first_cycle_multipass_dfa_lookahead != lookahead)
1827         {
1828           cached_first_cycle_multipass_dfa_lookahead = lookahead;
1829           max_lookahead_tries = 100;
1830           for (i = 0; i < issue_rate; i++)
1831             max_lookahead_tries *= lookahead;
1832         }
1833       insn = ready_element (ready, 0);
1834       if (INSN_CODE (insn) < 0)
1835         return ready_remove_first (ready);
1836       for (i = 1; i < ready->n_ready; i++)
1837         {
1838           insn = ready_element (ready, i);
1839           ready_try [i]
1840             = (INSN_CODE (insn) < 0
1841                || (targetm.sched.first_cycle_multipass_dfa_lookahead_guard
1842                    && !targetm.sched.first_cycle_multipass_dfa_lookahead_guard (insn)));
1843         }
1844       if (max_issue (ready, &index) == 0)
1845         return ready_remove_first (ready);
1846       else
1847         return ready_remove (ready, index);
1848     }
1849 }
1850
1851 /* Use forward list scheduling to rearrange insns of block B in region RGN,
1852    possibly bringing insns from subsequent blocks in the same region.  */
1853
1854 void
1855 schedule_block (int b, int rgn_n_insns)
1856 {
1857   struct ready_list ready;
1858   int i, first_cycle_insn_p;
1859   int can_issue_more;
1860   state_t temp_state = NULL;  /* It is used for multipass scheduling.  */
1861   int sort_p, advance, start_clock_var;
1862
1863   /* Head/tail info for this block.  */
1864   rtx prev_head = current_sched_info->prev_head;
1865   rtx next_tail = current_sched_info->next_tail;
1866   rtx head = NEXT_INSN (prev_head);
1867   rtx tail = PREV_INSN (next_tail);
1868
1869   /* We used to have code to avoid getting parameters moved from hard
1870      argument registers into pseudos.
1871
1872      However, it was removed when it proved to be of marginal benefit
1873      and caused problems because schedule_block and compute_forward_dependences
1874      had different notions of what the "head" insn was.  */
1875
1876   if (head == tail && (! INSN_P (head)))
1877     abort ();
1878
1879   /* Debug info.  */
1880   if (sched_verbose)
1881     {
1882       fprintf (sched_dump, ";;   ======================================================\n");
1883       fprintf (sched_dump,
1884                ";;   -- basic block %d from %d to %d -- %s reload\n",
1885                b, INSN_UID (head), INSN_UID (tail),
1886                (reload_completed ? "after" : "before"));
1887       fprintf (sched_dump, ";;   ======================================================\n");
1888       fprintf (sched_dump, "\n");
1889     }
1890
1891   state_reset (curr_state);
1892
1893   /* Allocate the ready list.  */
1894   ready.veclen = rgn_n_insns + 1 + issue_rate;
1895   ready.first = ready.veclen - 1;
1896   ready.vec = xmalloc (ready.veclen * sizeof (rtx));
1897   ready.n_ready = 0;
1898
1899   /* It is used for first cycle multipass scheduling.  */
1900   temp_state = alloca (dfa_state_size);
1901   ready_try = xcalloc ((rgn_n_insns + 1), sizeof (char));
1902   choice_stack = xmalloc ((rgn_n_insns + 1)
1903                           * sizeof (struct choice_entry));
1904   for (i = 0; i <= rgn_n_insns; i++)
1905     choice_stack[i].state = xmalloc (dfa_state_size);
1906
1907   (*current_sched_info->init_ready_list) (&ready);
1908
1909   if (targetm.sched.md_init)
1910     targetm.sched.md_init (sched_dump, sched_verbose, ready.veclen);
1911
1912   /* We start inserting insns after PREV_HEAD.  */
1913   last_scheduled_insn = prev_head;
1914
1915   /* Initialize INSN_QUEUE.  Q_SIZE is the total number of insns in the
1916      queue.  */
1917   q_ptr = 0;
1918   q_size = 0;
1919
1920   insn_queue = alloca ((max_insn_queue_index + 1) * sizeof (rtx));
1921   memset (insn_queue, 0, (max_insn_queue_index + 1) * sizeof (rtx));
1922   last_clock_var = -1;
1923
1924   /* Start just before the beginning of time.  */
1925   clock_var = -1;
1926   advance = 0;
1927
1928   sort_p = TRUE;
1929   /* Loop until all the insns in BB are scheduled.  */
1930   while ((*current_sched_info->schedule_more_p) ())
1931     {
1932       do
1933         {
1934           start_clock_var = clock_var;
1935
1936           clock_var++;
1937
1938           advance_one_cycle ();
1939
1940           /* Add to the ready list all pending insns that can be issued now.
1941              If there are no ready insns, increment clock until one
1942              is ready and add all pending insns at that point to the ready
1943              list.  */
1944           queue_to_ready (&ready);
1945
1946           if (ready.n_ready == 0)
1947             abort ();
1948
1949           if (sched_verbose >= 2)
1950             {
1951               fprintf (sched_dump, ";;\t\tReady list after queue_to_ready:  ");
1952               debug_ready_list (&ready);
1953             }
1954           advance -= clock_var - start_clock_var;
1955         }
1956       while (advance > 0);
1957
1958       if (sort_p)
1959         {
1960           /* Sort the ready list based on priority.  */
1961           ready_sort (&ready);
1962
1963           if (sched_verbose >= 2)
1964             {
1965               fprintf (sched_dump, ";;\t\tReady list after ready_sort:  ");
1966               debug_ready_list (&ready);
1967             }
1968         }
1969
1970       /* Allow the target to reorder the list, typically for
1971          better instruction bundling.  */
1972       if (sort_p && targetm.sched.reorder
1973           && (ready.n_ready == 0
1974               || !SCHED_GROUP_P (ready_element (&ready, 0))))
1975         can_issue_more =
1976           targetm.sched.reorder (sched_dump, sched_verbose,
1977                                  ready_lastpos (&ready),
1978                                  &ready.n_ready, clock_var);
1979       else
1980         can_issue_more = issue_rate;
1981
1982       first_cycle_insn_p = 1;
1983       cycle_issued_insns = 0;
1984       for (;;)
1985         {
1986           rtx insn;
1987           int cost;
1988           bool asm_p = false;
1989
1990           if (sched_verbose >= 2)
1991             {
1992               fprintf (sched_dump, ";;\tReady list (t =%3d):  ",
1993                        clock_var);
1994               debug_ready_list (&ready);
1995             }
1996
1997           if (ready.n_ready == 0
1998               && can_issue_more
1999               && reload_completed)
2000             {
2001               /* Allow scheduling insns directly from the queue in case
2002                  there's nothing better to do (ready list is empty) but
2003                  there are still vacant dispatch slots in the current cycle.  */
2004               if (sched_verbose >= 6)
2005                 fprintf(sched_dump,";;\t\tSecond chance\n");
2006               memcpy (temp_state, curr_state, dfa_state_size);
2007               if (early_queue_to_ready (temp_state, &ready))
2008                 ready_sort (&ready);
2009             }
2010
2011           if (ready.n_ready == 0 || !can_issue_more
2012               || state_dead_lock_p (curr_state)
2013               || !(*current_sched_info->schedule_more_p) ())
2014             break;
2015
2016           /* Select and remove the insn from the ready list.  */
2017           if (sort_p)
2018             insn = choose_ready (&ready);
2019           else
2020             insn = ready_remove_first (&ready);
2021
2022           if (targetm.sched.dfa_new_cycle
2023               && targetm.sched.dfa_new_cycle (sched_dump, sched_verbose,
2024                                               insn, last_clock_var,
2025                                               clock_var, &sort_p))
2026             {
2027               ready_add (&ready, insn);
2028               break;
2029             }
2030
2031           sort_p = TRUE;
2032           memcpy (temp_state, curr_state, dfa_state_size);
2033           if (recog_memoized (insn) < 0)
2034             {
2035               asm_p = (GET_CODE (PATTERN (insn)) == ASM_INPUT
2036                        || asm_noperands (PATTERN (insn)) >= 0);
2037               if (!first_cycle_insn_p && asm_p)
2038                 /* This is asm insn which is tryed to be issued on the
2039                    cycle not first.  Issue it on the next cycle.  */
2040                 cost = 1;
2041               else
2042                 /* A USE insn, or something else we don't need to
2043                    understand.  We can't pass these directly to
2044                    state_transition because it will trigger a
2045                    fatal error for unrecognizable insns.  */
2046                 cost = 0;
2047             }
2048           else
2049             {
2050               cost = state_transition (temp_state, insn);
2051               if (cost < 0)
2052                 cost = 0;
2053               else if (cost == 0)
2054                 cost = 1;
2055             }
2056
2057           if (cost >= 1)
2058             {
2059               queue_insn (insn, cost);
2060               continue;
2061             }
2062
2063           if (! (*current_sched_info->can_schedule_ready_p) (insn))
2064             goto next;
2065
2066           last_scheduled_insn = move_insn (insn, last_scheduled_insn);
2067
2068           if (memcmp (curr_state, temp_state, dfa_state_size) != 0)
2069             cycle_issued_insns++;
2070           memcpy (curr_state, temp_state, dfa_state_size);
2071
2072           if (targetm.sched.variable_issue)
2073             can_issue_more =
2074               targetm.sched.variable_issue (sched_dump, sched_verbose,
2075                                                insn, can_issue_more);
2076           /* A naked CLOBBER or USE generates no instruction, so do
2077              not count them against the issue rate.  */
2078           else if (GET_CODE (PATTERN (insn)) != USE
2079                    && GET_CODE (PATTERN (insn)) != CLOBBER)
2080             can_issue_more--;
2081
2082           advance = schedule_insn (insn, &ready, clock_var);
2083
2084           /* After issuing an asm insn we should start a new cycle.  */
2085           if (advance == 0 && asm_p)
2086             advance = 1;
2087           if (advance != 0)
2088             break;
2089
2090         next:
2091           first_cycle_insn_p = 0;
2092
2093           /* Sort the ready list based on priority.  This must be
2094              redone here, as schedule_insn may have readied additional
2095              insns that will not be sorted correctly.  */
2096           if (ready.n_ready > 0)
2097             ready_sort (&ready);
2098
2099           if (targetm.sched.reorder2
2100               && (ready.n_ready == 0
2101                   || !SCHED_GROUP_P (ready_element (&ready, 0))))
2102             {
2103               can_issue_more =
2104                 targetm.sched.reorder2 (sched_dump, sched_verbose,
2105                                         ready.n_ready
2106                                         ? ready_lastpos (&ready) : NULL,
2107                                         &ready.n_ready, clock_var);
2108             }
2109         }
2110     }
2111
2112   if (targetm.sched.md_finish)
2113     targetm.sched.md_finish (sched_dump, sched_verbose);
2114
2115   /* Debug info.  */
2116   if (sched_verbose)
2117     {
2118       fprintf (sched_dump, ";;\tReady list (final):  ");
2119       debug_ready_list (&ready);
2120     }
2121
2122   /* Sanity check -- queue must be empty now.  Meaningless if region has
2123      multiple bbs.  */
2124   if (current_sched_info->queue_must_finish_empty && q_size != 0)
2125       abort ();
2126
2127   /* Update head/tail boundaries.  */
2128   head = NEXT_INSN (prev_head);
2129   tail = last_scheduled_insn;
2130
2131   if (!reload_completed)
2132     {
2133       rtx insn, link, next;
2134
2135       /* INSN_TICK (minimum clock tick at which the insn becomes
2136          ready) may be not correct for the insn in the subsequent
2137          blocks of the region.  We should use a correct value of
2138          `clock_var' or modify INSN_TICK.  It is better to keep
2139          clock_var value equal to 0 at the start of a basic block.
2140          Therefore we modify INSN_TICK here.  */
2141       for (insn = head; insn != tail; insn = NEXT_INSN (insn))
2142         if (INSN_P (insn))
2143           {
2144             for (link = INSN_DEPEND (insn); link != 0; link = XEXP (link, 1))
2145               {
2146                 next = XEXP (link, 0);
2147                 INSN_TICK (next) -= clock_var;
2148               }
2149           }
2150     }
2151
2152   /* Restore-other-notes: NOTE_LIST is the end of a chain of notes
2153      previously found among the insns.  Insert them at the beginning
2154      of the insns.  */
2155   if (note_list != 0)
2156     {
2157       rtx note_head = note_list;
2158
2159       while (PREV_INSN (note_head))
2160         {
2161           note_head = PREV_INSN (note_head);
2162         }
2163
2164       PREV_INSN (note_head) = PREV_INSN (head);
2165       NEXT_INSN (PREV_INSN (head)) = note_head;
2166       PREV_INSN (head) = note_list;
2167       NEXT_INSN (note_list) = head;
2168       head = note_head;
2169     }
2170
2171   /* Debugging.  */
2172   if (sched_verbose)
2173     {
2174       fprintf (sched_dump, ";;   total time = %d\n;;   new head = %d\n",
2175                clock_var, INSN_UID (head));
2176       fprintf (sched_dump, ";;   new tail = %d\n\n",
2177                INSN_UID (tail));
2178     }
2179
2180   current_sched_info->head = head;
2181   current_sched_info->tail = tail;
2182
2183   free (ready.vec);
2184
2185   free (ready_try);
2186   for (i = 0; i <= rgn_n_insns; i++)
2187     free (choice_stack [i].state);
2188   free (choice_stack);
2189 }
2190 \f
2191 /* Set_priorities: compute priority of each insn in the block.  */
2192
2193 int
2194 set_priorities (rtx head, rtx tail)
2195 {
2196   rtx insn;
2197   int n_insn;
2198   int sched_max_insns_priority =
2199         current_sched_info->sched_max_insns_priority;
2200   rtx prev_head;
2201
2202   prev_head = PREV_INSN (head);
2203
2204   if (head == tail && (! INSN_P (head)))
2205     return 0;
2206
2207   n_insn = 0;
2208   sched_max_insns_priority = 0;
2209   for (insn = tail; insn != prev_head; insn = PREV_INSN (insn))
2210     {
2211       if (NOTE_P (insn))
2212         continue;
2213
2214       n_insn++;
2215       (void) priority (insn);
2216
2217       if (INSN_PRIORITY_KNOWN (insn))
2218         sched_max_insns_priority =
2219           MAX (sched_max_insns_priority, INSN_PRIORITY (insn));
2220     }
2221   sched_max_insns_priority += 1;
2222   current_sched_info->sched_max_insns_priority =
2223         sched_max_insns_priority;
2224
2225   return n_insn;
2226 }
2227
2228 /* Initialize some global state for the scheduler.  DUMP_FILE is to be used
2229    for debugging output.  */
2230
2231 void
2232 sched_init (FILE *dump_file)
2233 {
2234   int luid;
2235   basic_block b;
2236   rtx insn;
2237   int i;
2238
2239   /* Disable speculative loads in their presence if cc0 defined.  */
2240 #ifdef HAVE_cc0
2241   flag_schedule_speculative_load = 0;
2242 #endif
2243
2244   /* Set dump and sched_verbose for the desired debugging output.  If no
2245      dump-file was specified, but -fsched-verbose=N (any N), print to stderr.
2246      For -fsched-verbose=N, N>=10, print everything to stderr.  */
2247   sched_verbose = sched_verbose_param;
2248   if (sched_verbose_param == 0 && dump_file)
2249     sched_verbose = 1;
2250   sched_dump = ((sched_verbose_param >= 10 || !dump_file)
2251                 ? stderr : dump_file);
2252
2253   /* Initialize issue_rate.  */
2254   if (targetm.sched.issue_rate)
2255     issue_rate = targetm.sched.issue_rate ();
2256   else
2257     issue_rate = 1;
2258
2259   if (cached_issue_rate != issue_rate)
2260     {
2261       cached_issue_rate = issue_rate;
2262       /* To invalidate max_lookahead_tries:  */
2263       cached_first_cycle_multipass_dfa_lookahead = 0;
2264     }
2265
2266   /* We use LUID 0 for the fake insn (UID 0) which holds dependencies for
2267      pseudos which do not cross calls.  */
2268   old_max_uid = get_max_uid () + 1;
2269
2270   h_i_d = xcalloc (old_max_uid, sizeof (*h_i_d));
2271
2272   for (i = 0; i < old_max_uid; i++)
2273     h_i_d [i].cost = -1;
2274
2275   if (targetm.sched.init_dfa_pre_cycle_insn)
2276     targetm.sched.init_dfa_pre_cycle_insn ();
2277
2278   if (targetm.sched.init_dfa_post_cycle_insn)
2279     targetm.sched.init_dfa_post_cycle_insn ();
2280
2281   dfa_start ();
2282   dfa_state_size = state_size ();
2283   curr_state = xmalloc (dfa_state_size);
2284
2285   h_i_d[0].luid = 0;
2286   luid = 1;
2287   FOR_EACH_BB (b)
2288     for (insn = BB_HEAD (b); ; insn = NEXT_INSN (insn))
2289       {
2290         INSN_LUID (insn) = luid;
2291
2292         /* Increment the next luid, unless this is a note.  We don't
2293            really need separate IDs for notes and we don't want to
2294            schedule differently depending on whether or not there are
2295            line-number notes, i.e., depending on whether or not we're
2296            generating debugging information.  */
2297         if (!NOTE_P (insn))
2298           ++luid;
2299
2300         if (insn == BB_END (b))
2301           break;
2302       }
2303
2304   init_dependency_caches (luid);
2305
2306   init_alias_analysis ();
2307
2308   if (write_symbols != NO_DEBUG)
2309     {
2310       rtx line;
2311
2312       line_note_head = xcalloc (last_basic_block, sizeof (rtx));
2313
2314       /* Save-line-note-head:
2315          Determine the line-number at the start of each basic block.
2316          This must be computed and saved now, because after a basic block's
2317          predecessor has been scheduled, it is impossible to accurately
2318          determine the correct line number for the first insn of the block.  */
2319
2320       FOR_EACH_BB (b)
2321         {
2322           for (line = BB_HEAD (b); line; line = PREV_INSN (line))
2323             if (NOTE_P (line) && NOTE_LINE_NUMBER (line) > 0)
2324               {
2325                 line_note_head[b->index] = line;
2326                 break;
2327               }
2328           /* Do a forward search as well, since we won't get to see the first
2329              notes in a basic block.  */
2330           for (line = BB_HEAD (b); line; line = NEXT_INSN (line))
2331             {
2332               if (INSN_P (line))
2333                 break;
2334               if (NOTE_P (line) && NOTE_LINE_NUMBER (line) > 0)
2335                 line_note_head[b->index] = line;
2336             }
2337         }
2338     }
2339
2340   /* ??? Add a NOTE after the last insn of the last basic block.  It is not
2341      known why this is done.  */
2342
2343   insn = BB_END (EXIT_BLOCK_PTR->prev_bb);
2344   if (NEXT_INSN (insn) == 0
2345       || (!NOTE_P (insn)
2346           && !LABEL_P (insn)
2347           /* Don't emit a NOTE if it would end up before a BARRIER.  */
2348           && !BARRIER_P (NEXT_INSN (insn))))
2349     {
2350       emit_note_after (NOTE_INSN_DELETED, BB_END (EXIT_BLOCK_PTR->prev_bb));
2351       /* Make insn to appear outside BB.  */
2352       BB_END (EXIT_BLOCK_PTR->prev_bb) = PREV_INSN (BB_END (EXIT_BLOCK_PTR->prev_bb));
2353     }
2354
2355   /* Compute INSN_REG_WEIGHT for all blocks.  We must do this before
2356      removing death notes.  */
2357   FOR_EACH_BB_REVERSE (b)
2358     find_insn_reg_weight (b->index);
2359
2360   if (targetm.sched.md_init_global)
2361       targetm.sched.md_init_global (sched_dump, sched_verbose, old_max_uid);
2362 }
2363
2364 /* Free global data used during insn scheduling.  */
2365
2366 void
2367 sched_finish (void)
2368 {
2369   free (h_i_d);
2370   free (curr_state);
2371   dfa_finish ();
2372   free_dependency_caches ();
2373   end_alias_analysis ();
2374   if (write_symbols != NO_DEBUG)
2375     free (line_note_head);
2376
2377   if (targetm.sched.md_finish_global)
2378       targetm.sched.md_finish_global (sched_dump, sched_verbose);
2379 }
2380 #endif /* INSN_SCHEDULING */