gcc/haifa-sched.c

   1 /* Instruction scheduling pass.
   2    Copyright (C) 1992, 1993, 1994, 1995, 1996, 1997, 1998,
   3    1999, 2000, 2001, 2002 Free Software Foundation, Inc.
   4    Contributed by Michael Tiemann (tiemann@cygnus.com) Enhanced by,
   5    and currently maintained by, Jim Wilson (wilson@cygnus.com)
   6
   7 This file is part of GCC.
   8
   9 GCC is free software; you can redistribute it and/or modify it under
  10 the terms of the GNU General Public License as published by the Free
  11 Software Foundation; either version 2, or (at your option) any later
  12 version.
  13
  14 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  15 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  16 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  17 for more details.
  18
  19 You should have received a copy of the GNU General Public License
  20 along with GCC; see the file COPYING.  If not, write to the Free
  21 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  22 02111-1307, USA.  */
  23
  24 /* Instruction scheduling pass.  This file, along with sched-deps.c,
  25    contains the generic parts.  The actual entry point for the normal
  26    instruction scheduling pass is found in sched-rgn.c.
  27
  28    We compute insn priorities based on data dependencies.  Flow
  29    analysis only creates a fraction of the data-dependencies we must
  30    observe: namely, only those dependencies which the combiner can be
  31    expected to use.  For this pass, we must therefore create the
  32    remaining dependencies we need to observe: register dependencies,
  33    memory dependencies, dependencies to keep function calls in order,
  34    and the dependence between a conditional branch and the setting of
  35    condition codes are all dealt with here.
  36
  37    The scheduler first traverses the data flow graph, starting with
  38    the last instruction, and proceeding to the first, assigning values
  39    to insn_priority as it goes.  This sorts the instructions
  40    topologically by data dependence.
  41
  42    Once priorities have been established, we order the insns using
  43    list scheduling.  This works as follows: starting with a list of
  44    all the ready insns, and sorted according to priority number, we
  45    schedule the insn from the end of the list by placing its
  46    predecessors in the list according to their priority order.  We
  47    consider this insn scheduled by setting the pointer to the "end" of
  48    the list to point to the previous insn.  When an insn has no
  49    predecessors, we either queue it until sufficient time has elapsed
  50    or add it to the ready list.  As the instructions are scheduled or
  51    when stalls are introduced, the queue advances and dumps insns into
  52    the ready list.  When all insns down to the lowest priority have
  53    been scheduled, the critical path of the basic block has been made
  54    as short as possible.  The remaining insns are then scheduled in
  55    remaining slots.
  56
  57    Function unit conflicts are resolved during forward list scheduling
  58    by tracking the time when each insn is committed to the schedule
  59    and from that, the time the function units it uses must be free.
  60    As insns on the ready list are considered for scheduling, those
  61    that would result in a blockage of the already committed insns are
  62    queued until no blockage will result.
  63
  64    The following list shows the order in which we want to break ties
  65    among insns in the ready list:
  66
  67    1.  choose insn with the longest path to end of bb, ties
  68    broken by
  69    2.  choose insn with least contribution to register pressure,
  70    ties broken by
  71    3.  prefer in-block upon interblock motion, ties broken by
  72    4.  prefer useful upon speculative motion, ties broken by
  73    5.  choose insn with largest control flow probability, ties
  74    broken by
  75    6.  choose insn with the least dependences upon the previously
  76    scheduled insn, or finally
  77    7.  choose the insn which has the most insns dependent on it.
  78    8.  choose insn with lowest UID.
  79
  80    Memory references complicate matters.  Only if we can be certain
  81    that memory references are not part of the data dependency graph
  82    (via true, anti, or output dependence), can we move operations past
  83    memory references.  To first approximation, reads can be done
  84    independently, while writes introduce dependencies.  Better
  85    approximations will yield fewer dependencies.
  86
  87    Before reload, an extended analysis of interblock data dependences
  88    is required for interblock scheduling.  This is performed in
  89    compute_block_backward_dependences ().
  90
  91    Dependencies set up by memory references are treated in exactly the
  92    same way as other dependencies, by using LOG_LINKS backward
  93    dependences.  LOG_LINKS are translated into INSN_DEPEND forward
  94    dependences for the purpose of forward list scheduling.
  95
  96    Having optimized the critical path, we may have also unduly
  97    extended the lifetimes of some registers.  If an operation requires
  98    that constants be loaded into registers, it is certainly desirable
  99    to load those constants as early as necessary, but no earlier.
 100    I.e., it will not do to load up a bunch of registers at the
 101    beginning of a basic block only to use them at the end, if they
 102    could be loaded later, since this may result in excessive register
 103    utilization.
 104
 105    Note that since branches are never in basic blocks, but only end
 106    basic blocks, this pass will not move branches.  But that is ok,
 107    since we can use GNU's delayed branch scheduling pass to take care
 108    of this case.
 109
 110    Also note that no further optimizations based on algebraic
 111    identities are performed, so this pass would be a good one to
 112    perform instruction splitting, such as breaking up a multiply
 113    instruction into shifts and adds where that is profitable.
 114
 115    Given the memory aliasing analysis that this pass should perform,
 116    it should be possible to remove redundant stores to memory, and to
 117    load values from registers instead of hitting memory.
 118
 119    Before reload, speculative insns are moved only if a 'proof' exists
 120    that no exception will be caused by this, and if no live registers
 121    exist that inhibit the motion (live registers constraints are not
 122    represented by data dependence edges).
 123
 124    This pass must update information that subsequent passes expect to
 125    be correct.  Namely: reg_n_refs, reg_n_sets, reg_n_deaths,
 126    reg_n_calls_crossed, and reg_live_length.  Also, BLOCK_HEAD,
 127    BLOCK_END.
 128
 129    The information in the line number notes is carefully retained by
 130    this pass.  Notes that refer to the starting and ending of
 131    exception regions are also carefully retained by this pass.  All
 132    other NOTE insns are grouped in their same relative order at the
 133    beginning of basic blocks and regions that have been scheduled.  */
 134 \f
 135 #include "config.h"
 136 #include "system.h"
 137 #include "toplev.h"
 138 #include "rtl.h"
 139 #include "tm_p.h"
 140 #include "hard-reg-set.h"
 141 #include "basic-block.h"
 142 #include "regs.h"
 143 #include "function.h"
 144 #include "flags.h"
 145 #include "insn-config.h"
 146 #include "insn-attr.h"
 147 #include "except.h"
 148 #include "toplev.h"
 149 #include "recog.h"
 150 #include "sched-int.h"
 151 #include "target.h"
 152
 153 #ifdef INSN_SCHEDULING
 154
 155 /* issue_rate is the number of insns that can be scheduled in the same
 156    machine cycle.  It can be defined in the config/mach/mach.h file,
 157    otherwise we set it to 1.  */
 158
 159 static int issue_rate;
 160
 161 /* If the following variable value is nonzero, the scheduler inserts
 162    bubbles (nop insns).  The value of the variable affects scheduler
 163    behavior only if the automaton pipeline interface with multipass
 164    scheduling is used and the hook dfa_bubble is defined.  */
 165 int insert_schedule_bubbles_p = 0;
 166
 167 /* sched-verbose controls the amount of debugging output the
 168    scheduler prints.  It is controlled by -fsched-verbose=N:
 169    N>0 and no -dSR : the output is directed to stderr.
 170    N>=10 will direct the printouts to stderr (regardless of -dSR).
 171    N=1: same as -dSR.
 172    N=2: bb's probabilities, detailed ready list info, unit/insn info.
 173    N=3: rtl at abort point, control-flow, regions info.
 174    N=5: dependences info.  */
 175
 176 static int sched_verbose_param = 0;
 177 int sched_verbose = 0;
 178
 179 /* Debugging file.  All printouts are sent to dump, which is always set,
 180    either to stderr, or to the dump listing file (-dRS).  */
 181 FILE *sched_dump = 0;
 182
 183 /* Highest uid before scheduling.  */
 184 static int old_max_uid;
 185
 186 /* Called from toplev.c for -fsched-verbose=N.  PARAM "verbose" stores
 187    atoi (VAL) in sched_verbose_param; any other PARAM gets a warning.  */
 188
 189 void
 190 fix_sched_param (param, val)
 191      const char *param, *val;
 192 {
 193   if (strcmp (param, "verbose") != 0)
 194     warning ("fix_sched_param: unknown param: %s", param);
 195   else
 196     sched_verbose_param = atoi (val);
 197 }
 198
 199 struct haifa_insn_data *h_i_d;  /* Indexed by INSN_UID; see the accessors below.  */
 200 /* Special priority values, and predicates on an insn's INSN_PRIORITY.  */
 201 #define DONE_PRIORITY   -1
 202 #define MAX_PRIORITY    0x7fffffff
 203 #define TAIL_PRIORITY   0x7ffffffe
 204 #define LAUNCH_PRIORITY 0x7f000001
 205 #define DONE_PRIORITY_P(INSN) (INSN_PRIORITY (INSN) < 0)  /* Priority is negative.  */
 206 #define LOW_PRIORITY_P(INSN) ((INSN_PRIORITY (INSN) & 0x7f000000) == 0)  /* Bits 24-30 clear.  */
 207 /* Accessors for fields of INSN's entry in h_i_d.  */
 208 #define LINE_NOTE(INSN)         (h_i_d[INSN_UID (INSN)].line_note)
 209 #define INSN_TICK(INSN)         (h_i_d[INSN_UID (INSN)].tick)
 210
 211 /* Vector indexed by basic block number giving the starting line-number
 212    for each basic block.  */
 213 static rtx *line_note_head;
 214
 215 /* List of important notes we must keep around.  This is a pointer to the
 216    last element in the list.  */
 217 static rtx note_list;
 218
 219 /* Queues, etc.  */
 220
 221 /* An instruction is ready to be scheduled when all insns preceding it
 222    have already been scheduled.  It is important to ensure that all
 223    insns which use its result will not be executed until its result
 224    has been computed.  An insn is maintained in one of four structures:
 225
 226    (P) the "Pending" set of insns which cannot be scheduled until
 227    their dependencies have been satisfied.
 228    (Q) the "Queued" set of insns that can be scheduled when sufficient
 229    time has passed.
 230    (R) the "Ready" list of unscheduled, uncommitted insns.
 231    (S) the "Scheduled" list of insns.
 232
 233    Initially, all insns are either "Pending" or "Ready" depending on
 234    whether their dependencies are satisfied.
 235
 236    Insns move from the "Ready" list to the "Scheduled" list as they
 237    are committed to the schedule.  As this occurs, the insns in the
 238    "Pending" list have their dependencies satisfied and move to either
 239    the "Ready" list or the "Queued" set depending on whether
 240    sufficient time has passed to make them ready.  As time passes,
 241    insns move from the "Queued" set to the "Ready" list.  Insns may
 242    move from the "Ready" list to the "Queued" set if they are blocked
 243    due to a function unit conflict.
 244
 245    The "Pending" list (P) are the insns in the INSN_DEPEND of the unscheduled
 246    insns, i.e., those that are ready, queued, and pending.
 247    The "Queued" set (Q) is implemented by the variable `insn_queue'.
 248    The "Ready" list (R) is implemented by the variables `ready' and
 249    `n_ready'.
 250    The "Scheduled" list (S) is the new insn chain built by this pass.
 251
 252    The transition (R->S) is implemented in the scheduling loop in
 253    `schedule_block' when the best insn to schedule is chosen.
 254    The transition (R->Q) is implemented in `queue_insn' when an
 255    insn is found to have a function unit conflict with the already
 256    committed insns.
 257    The transitions (P->R and P->Q) are implemented in `schedule_insn' as
 258    insns move from the ready list to the scheduled list.
 259    The transition (Q->R) is implemented in `queue_to_ready' as time
 260    passes or stalls are introduced.  */
 261
 262 /* Implement a circular buffer to delay instructions until sufficient
 263    time has passed.  For the old pipeline description interface,
 264    INSN_QUEUE_SIZE is a power of two larger than MAX_BLOCKAGE and
 265    MAX_READY_COST computed by genattr.c.  For the new pipeline
 266    description interface, MAX_INSN_QUEUE_INDEX is a power of two minus
 267    one which is larger than maximal time of instruction execution
 268    computed by genattr.c on the base maximal time of functional unit
 269    reservations and getting a result.  This is the longest time an
 270    insn may be queued.  */
 271
 272 #define MAX_INSN_QUEUE_INDEX max_insn_queue_index_macro_value
 273
 274 static rtx *insn_queue;
 275 static int q_ptr = 0;
 276 static int q_size = 0;
 277 #define NEXT_Q(X) (((X)+1) & MAX_INSN_QUEUE_INDEX)  /* Queue index after X, wrapped by the mask.  */
 278 #define NEXT_Q_AFTER(X, C) (((X)+(C)) & MAX_INSN_QUEUE_INDEX)  /* Index C slots after X; C is parenthesized so any expression is safe.  */
 279
 280 /* The following variable defines value for macro
 281    MAX_INSN_QUEUE_INDEX.  */
 282 static int max_insn_queue_index_macro_value;
 283
 284 /* The following variable value refers to all current and future
 285    reservations of the processor units.  */
 286 state_t curr_state;
 287
 288 /* The following variable value is size of memory representing all
 289    current and future reservations of the processor units.  It is used
 290    only by DFA based scheduler.  */
 291 static size_t dfa_state_size;
 292
 293 /* The following array is used to find the best insn from ready when
 294    the automaton pipeline interface is used.  */
 295 static char *ready_try;
 296
 297 /* Describe the ready list of the scheduler.
 298    VEC holds space enough for all insns in the current region.  VECLEN
 299    says how many exactly.
 300    FIRST is the index of the element with the highest priority; i.e. the
 301    last one in the ready list, since elements are ordered by ascending
 302    priority.
 303    N_READY determines how many insns are on the ready list.  */
 304
 305 struct ready_list
 306 {
 307   rtx *vec;       /* Storage with room for all insns in the current region.  */
 308   int veclen;     /* Number of elements VEC can hold.  */
 309   int first;      /* Index in VEC of the highest-priority insn.  */
 310   int n_ready;    /* Number of insns currently on the ready list.  */
 311 };
 312
 313 /* Forward declarations.  */
 314
 315 /* The scheduler using only DFA description should never use the
 316    following five functions:  */
 317 static unsigned int blockage_range PARAMS ((int, rtx));
 318 static void clear_units PARAMS ((void));
 319 static void schedule_unit PARAMS ((int, rtx, int));
 320 static int actual_hazard PARAMS ((int, rtx, int, int));
 321 static int potential_hazard PARAMS ((int, rtx, int));
 322
 323 static int priority PARAMS ((rtx));
 324 static int rank_for_schedule PARAMS ((const PTR, const PTR));
 325 static void swap_sort PARAMS ((rtx *, int));
 326 static void queue_insn PARAMS ((rtx, int));
 327 static void schedule_insn PARAMS ((rtx, struct ready_list *, int));
 328 static void find_insn_reg_weight PARAMS ((int));
 329 static void adjust_priority PARAMS ((rtx));
 330 static void advance_one_cycle PARAMS ((void));
 331
 332 /* Notes handling mechanism:
 333    =========================
 334    Generally, NOTES are saved before scheduling and restored after scheduling.
 335    The scheduler distinguishes between three types of notes:
 336
 337    (1) LINE_NUMBER notes, generated and used for debugging.  Here,
 338    before scheduling a region, a pointer to the LINE_NUMBER note is
 339    added to the insn following it (in save_line_notes()), and the note
 340    is removed (in rm_line_notes() and unlink_line_notes()).  After
 341    scheduling the region, this pointer is used for regeneration of
 342    the LINE_NUMBER note (in restore_line_notes()).
 343
 344    (2) LOOP_BEGIN, LOOP_END, SETJMP, EHREGION_BEG, EHREGION_END notes:
 345    Before scheduling a region, a pointer to the note is added to the insn
 346    that follows or precedes it.  (This happens as part of the data dependence
 347    computation).  After scheduling an insn, the pointer contained in it is
 348    used for regenerating the corresponding note (in reemit_notes).
 349
 350    (3) All other notes (e.g. INSN_DELETED):  Before scheduling a block,
 351    these notes are put in a list (in rm_other_notes() and
 352    unlink_other_notes ()).  After scheduling the block, these notes are
 353    inserted at the beginning of the block (in schedule_block()).  */
 354
 355 static rtx unlink_other_notes PARAMS ((rtx, rtx));
 356 static rtx unlink_line_notes PARAMS ((rtx, rtx));
 357 static rtx reemit_notes PARAMS ((rtx, rtx));
 358
 359 static rtx *ready_lastpos PARAMS ((struct ready_list *));
 360 static void ready_sort PARAMS ((struct ready_list *));
 361 static rtx ready_remove_first PARAMS ((struct ready_list *));
 362
 363 static void queue_to_ready PARAMS ((struct ready_list *));
 364
 365 static void debug_ready_list PARAMS ((struct ready_list *));
 366
 367 static rtx move_insn1 PARAMS ((rtx, rtx));
 368 static rtx move_insn PARAMS ((rtx, rtx));
 369
 370 /* The following functions are used to implement multi-pass scheduling
 371    on the first cycle.  It is used only for DFA based scheduler.  */
 372 static rtx ready_element PARAMS ((struct ready_list *, int));
 373 static rtx ready_remove PARAMS ((struct ready_list *, int));
 374 static int max_issue PARAMS ((struct ready_list *, state_t, int *));
 375
 376 static rtx choose_ready PARAMS ((struct ready_list *));
 377
 378 #endif /* INSN_SCHEDULING */
 379 \f
 380 /* Point to state used for the current scheduling pass.  */
 381 struct sched_info *current_sched_info;
 382 \f
 383 #ifndef INSN_SCHEDULING
 384 void
 385 schedule_insns (dump_file)
 386      FILE *dump_file ATTRIBUTE_UNUSED;
 387 {  /* No-op stub compiled when INSN_SCHEDULING is not defined.  */
 388 }
 389 #else
 390
 391 /* Pointer to the last instruction scheduled.  Used by rank_for_schedule,
 392    so that insns independent of the last scheduled insn will be preferred
 393    over dependent instructions.  */
 394
 395 static rtx last_scheduled_insn;
 396
 397 /* Return the function units used by INSN, consulting and filling the
 398    per-insn cache behind INSN_UNIT.  A non-negative result is a unit
 399    number; a negative result is the complement of a mask of units.
 400    The cache keeps non-negative values biased by one so that zero can
 401    mean "not computed yet".  The scheduler using only DFA description
 402    should never use the following function.  */
 403
 404 HAIFA_INLINE int
 405 insn_unit (insn)
 406      rtx insn;
 407 {
 408   int unit = INSN_UNIT (insn);
 409
 410   /* Non-zero means an earlier call cached the (biased) value.  */
 411   if (unit != 0)
 412     return unit > 0 ? unit - 1 : unit;
 413   recog_memoized (insn);
 414
 415   /* An insn that was not recognized (a USE, say) must not reach
 416      function_units_used, which treats that as a fatal error.  */
 417   if (INSN_CODE (insn) >= 0)
 418     {
 419       unit = function_units_used (insn);
 420       /* Bias non-negative values by one so zero stays "unknown".  */
 421       if (unit >= 0)
 422         unit++;
 423     }
 424   else
 425     unit = -1;
 426
 427   /* Only 16 bits are cached; skip caching values that do not fit.  */
 428   if (FUNCTION_UNITS_SIZE < HOST_BITS_PER_SHORT
 429       || unit >= 0
 430       || (unit & ~((1 << (HOST_BITS_PER_SHORT - 1)) - 1)) == 0)
 431     INSN_UNIT (insn) = unit;
 432
 433   return unit > 0 ? unit - 1 : unit;
 434 }
 435
 436 /* Return the blockage range of INSN on UNIT, as reported by the unit's
 437    blockage_range_function.  The result packs the minimum blockage in
 438    the upper half of an int and the maximum in the lower half.  One
 439    (unit, range) pair is cached per insn in INSN_BLOCKAGE.  The
 440    scheduler using only DFA description should never use the following
 441    function.  */
 442
 443 HAIFA_INLINE static unsigned int
 444 blockage_range (unit, insn)
 445      int unit;
 446      rtx insn;
 447 {
 448   unsigned int cached = INSN_BLOCKAGE (insn);
 449   unsigned int range;
 450
 451   /* The cache stores UNIT + 1, so a match means it describes this unit.  */
 452   if ((int) UNIT_BLOCKED (cached) == unit + 1)
 453     return BLOCKAGE_RANGE (cached);
 454
 455   range = function_units[unit].blockage_range_function (insn);
 456
 457   /* Remember the range for this one unit, provided the encoding fits
 458      in an int.  */
 459   if (HOST_BITS_PER_INT >= UNIT_BITS + 2 * BLOCKAGE_BITS)
 460     INSN_BLOCKAGE (insn) = ENCODE_BLOCKAGE (unit + 1, range);
 461
 462   return range;
 463 }
 464
 465 /* A vector indexed by function unit instance giving the last insn to
 466    use the unit.  The value of the function unit instance index for
 467    unit U instance I is (U + I * FUNCTION_UNITS_SIZE).  The scheduler
 468    using only DFA description should never use the following variable.  */
 469 #if FUNCTION_UNITS_SIZE
 470 static rtx unit_last_insn[FUNCTION_UNITS_SIZE * MAX_MULTIPLICITY];
 471 #else
 472 static rtx unit_last_insn[1];
 473 #endif
 474
 475 /* A vector indexed by function unit instance giving the minimum time
 476    when the unit will unblock based on the maximum blockage cost.  The
 477    scheduler using only DFA description should never use the following
 478    variable.  */
 479 #if FUNCTION_UNITS_SIZE
 480 static int unit_tick[FUNCTION_UNITS_SIZE * MAX_MULTIPLICITY];
 481 #else
 482 static int unit_tick[1];
 483 #endif
 484
 485 /* A vector indexed by function unit number giving the number of insns
 486    that remain to use the unit.  The scheduler using only DFA
 487    description should never use the following variable.  */
 488 #if FUNCTION_UNITS_SIZE
 489 static int unit_n_insns[FUNCTION_UNITS_SIZE];
 490 #else
 491 static int unit_n_insns[1];
 492 #endif
 493
 494 /* Return the insn recorded in unit_last_insn for function unit instance
 495    INSTANCE.  Used by the visualization code; DFA-only scheduling should not use it.  */
 496
 497 rtx
 498 get_unit_last_insn (instance)
 499      int instance;
 500 {
 501   rtx last_user = unit_last_insn[instance];
 502   return last_user;
 503 }
 504
 505 /* Zero the per-unit bookkeeping arrays, forgetting all unit usage.  */
 506
 507 static void
 508 clear_units ()
 509 {
 510   memset ((char *) unit_n_insns, 0, sizeof unit_n_insns);
 511   memset ((char *) unit_tick, 0, sizeof unit_tick);
 512   memset ((char *) unit_last_insn, 0, sizeof unit_last_insn);
 513 }
 514
 515 /* Return the issue-delay of INSN, i.e. its blockage against itself.
 516    The scheduler using only DFA description should never use it.  */
 517
 518 HAIFA_INLINE int
 519 insn_issue_delay (insn)
 520      rtx insn;
 521 {
 522   int unit = insn_unit (insn);
 523   int delay = 0;
 524   int i;
 525
 526   /* Efficiency note: this works 'hard' to recompute a value that the
 527      md file had but the function_units[] structure does not carry.
 528      It would be nice to have this value there, too.  */
 529   if (unit < 0)
 530     {
 531       for (i = 0, unit = ~unit; unit != 0; i++, unit >>= 1)
 532         if ((unit & 1) != 0
 533             && function_units[i].blockage_range_function
 534             && function_units[i].blockage_function)
 535           delay = MAX (delay, function_units[i].blockage_function (insn, insn));
 536     }
 537   else if (function_units[unit].blockage_range_function
 538            && function_units[unit].blockage_function)
 539     delay = function_units[unit].blockage_function (insn, insn);
 540
 541   return delay;
 542 }
 543
 544 /* Return the actual hazard cost of issuing INSN at time CLOCK on
 545    instance INSTANCE of function unit UNIT.  COST is the hazard cost
 546    found so far; the result is never smaller than COST.  The scheduler
 547    using only DFA description should never use the following function.  */
 548
 549 HAIFA_INLINE int
 550 actual_hazard_this_instance (unit, instance, insn, clock, cost)
 551      int unit, instance, clock, cost;
 552      rtx insn;
 553 {
 554   /* When the instance unblocks, assuming the unit's maximum blockage.  */
 555   int tick = unit_tick[instance];
 556
 557   /* Even that pessimistic bound does not exceed COST: nothing to add.  */
 558   if (tick - clock <= cost)
 559     return cost;
 560
 561   /* The scheduler works forward, so the unit's last insn is the one
 562      executing and INSN is the candidate.  Refine the bound using the
 563      most exact blockage figure the unit offers: the blockage function
 564      if present, else the maximum of INSN's blockage range.  A unit
 565      with no blockage range function has only its max blockage
 566      constant, which TICK already reflects.  */
 567   if (function_units[unit].blockage_range_function)
 568     {
 569       if (function_units[unit].blockage_function)
 570         tick += (function_units[unit].blockage_function
 571                  (unit_last_insn[instance], insn)
 572                  - function_units[unit].max_blockage);
 573       else
 574         tick += ((int) MAX_BLOCKAGE_COST (blockage_range (unit, insn))
 575                  - function_units[unit].max_blockage);
 576     }
 577
 578   if (tick - clock > cost)
 579     cost = tick - clock;
 580   return cost;
 581 }
 582
 583 /* Record that INSN began execution at time CLOCK on the units encoded
 584    by UNIT.  The scheduler using only DFA description should never use
 585    the following function.  */
 586
 587 HAIFA_INLINE static void
 588 schedule_unit (unit, insn, clock)
 589      int unit, clock;
 590      rtx insn;
 591 {
 592   int i;
 593
 594   if (unit >= 0)
 595     {
 596       int instance = unit;
 597 #if MAX_MULTIPLICITY > 1
 598       /* Take the first instance showing no actual hazard.  One is
 599          assumed free, so the last instance is never tested.  */
 600       for (i = function_units[unit].multiplicity - 1;
 601            i > 0
 602            && actual_hazard_this_instance (unit, instance, insn, clock, 0);
 603            i--)
 604         instance += FUNCTION_UNITS_SIZE;
 605 #endif
 606       unit_last_insn[instance] = insn;
 607       unit_tick[instance] = (clock + function_units[unit].max_blockage);
 608     }
 609   else
 610     /* A negative UNIT is the complement of a mask of units.  */
 611     for (i = 0, unit = ~unit; unit; i++, unit >>= 1)
 612       if ((unit & 1) != 0)
 613         schedule_unit (i, insn, clock);
 614 }
 615
 616 /* Return the actual hazard cost of executing INSN on the units
 617    encoded by UNIT at time CLOCK if the previous actual hazard cost
 618    was COST.  The scheduler using only DFA description should never
 619    use the following function.  */
 620
 621 HAIFA_INLINE static int
 622 actual_hazard (unit, insn, clock, cost)
 623      int unit, clock, cost;
 624      rtx insn;
 625 {
 626   int i;
 627
 628   if (unit >= 0)
 629     {
 630       /* Find the instance of the function unit with the minimum hazard.  */
 631       int instance = unit;
 632       int best_cost = actual_hazard_this_instance (unit, instance, insn,
 633                                                    clock, cost);
 634 #if MAX_MULTIPLICITY > 1
 635       int this_cost;
 636
 637       if (best_cost > cost)
 638         {
 639           for (i = function_units[unit].multiplicity - 1; i > 0; i--)
 640             {
 641               instance += FUNCTION_UNITS_SIZE;
 642               this_cost = actual_hazard_this_instance (unit, instance, insn,
 643                                                        clock, cost);
 644               if (this_cost < best_cost)
 645                 {
 646                   best_cost = this_cost;
 647                   if (this_cost <= cost)
 648                     break;
 649                 }
 650             }
 651         }
 652 #endif
 653       cost = MAX (cost, best_cost);
 654     }
 655   else
 656     for (i = 0, unit = ~unit; unit; i++, unit >>= 1)
 657       if ((unit & 1) != 0)
 658         cost = actual_hazard (i, insn, clock, cost);
 659
 660   return cost;
 661 }
 662
 663 /* Return the potential hazard cost of issuing INSN on the units
 664    encoded by UNIT, given that the potential hazard cost found so far
 665    is COST.  The aim is to minimize a subsequent actual hazard: an
 666    insn with a large blockage time is preferred over one with a
 667    smaller time, and an insn using a unit that is more likely to be
 668    used is preferred over one using a less-used unit.  The scheduler
 669    using only DFA description should never use the following
 670    function.  */
 671
 672 HAIFA_INLINE static int
 673 potential_hazard (unit, insn, cost)
 674      int unit, cost;
 675      rtx insn;
 676 {
 677   unsigned int minb, maxb, range;
 678   int i, ncost;
 679
 680   if (unit < 0)
 681     {
 682       /* UNIT is the complement of a mask: accumulate over its units.  */
 683       for (i = 0, unit = ~unit; unit; i++, unit >>= 1)
 684         if ((unit & 1) != 0)
 685           cost = potential_hazard (i, insn, cost);
 686       return cost;
 687     }
 688
 689   /* Start from the unit's maximum blockage.  A maximum of one or less
 690      leaves COST as it is.  */
 691   minb = maxb = function_units[unit].max_blockage;
 692   if (maxb <= 1)
 693     return cost;
 694
 695   /* Use INSN's own blockage range when the unit can supply one.  */
 696   if (function_units[unit].blockage_range_function)
 697     {
 698       range = blockage_range (unit, insn);
 699       maxb = MAX_BLOCKAGE_COST (range);
 700       minb = MIN_BLOCKAGE_COST (range);
 701     }
 702   if (maxb <= 1)
 703     return cost;
 704
 705   /* Make the number of instructions left dominate.  Make the minimum
 706      delay dominate the maximum delay.  If all these are the same, use
 707      the unit number to add an arbitrary ordering.  */
 708   ncost = minb * 0x40 + maxb;
 709   ncost *= (unit_n_insns[unit] - 1) * 0x1000 + unit;
 710   return ncost > cost ? ncost : cost;
 711 }
 712
 713 /* Return the cost, in cycles from issue to result, of INSN as seen
 714    through dependence LINK by the dependent insn USED.  If LINK or
 715    USED is zero, the cost is estimated without regard to any user.  */
 716
 717 HAIFA_INLINE int
 718 insn_cost (insn, link, used)
 719      rtx insn, link, used;
 720 {
 721   int cost = INSN_COST (insn);
 722
 723   /* A negative INSN_COST is taken to mean "not computed yet".  */
 724   if (cost < 0)
 725     {
 726       /* A USE insn, or something else we don't need to understand.
 727          Such insns must not be passed to result_ready_cost or
 728          insn_default_latency, which trigger a fatal error for
 729          unrecognizable insns; they are simply given cost zero.  */
 730       if (recog_memoized (insn) < 0)
 731         {
 732           INSN_COST (insn) = 0;
 733           return 0;
 734         }
 735
 736       /* Ask whichever pipeline description is in use for the latency.  */
 737       cost = ((targetm.sched.use_dfa_pipeline_interface
 738                && (*targetm.sched.use_dfa_pipeline_interface) ())
 739               ? insn_default_latency (insn)
 740               : result_ready_cost (insn));
 741
 742       /* Clamp and cache, so later calls skip the lookup.  */
 743       if (cost < 0)
 744         cost = 0;
 745       INSN_COST (insn) = cost;
 746     }
 747
 748   /* In this case estimate cost without caring how insn is used.  */
 749   if (link == 0 || used == 0)
 750     return cost;
 751
 752   /* A USE insn should never require the value used to be computed.
 753      This allows the computation of a function's result and parameter
 754      values to overlap the return and call.  */
 755   if (recog_memoized (used) < 0)
 756     return 0;
 757
 758   /* With the DFA interface and a recognized INSN, refine the latency
 759      by the kind of dependence LINK records: an anti dependence costs
 760      nothing, an output dependence costs the difference of the two
 761      default latencies (but at least one cycle), and anything else
 762      uses insn_latency when bypass_p (INSN) holds.  */
 763   if (targetm.sched.use_dfa_pipeline_interface
 764       && (*targetm.sched.use_dfa_pipeline_interface) ()
 765       && INSN_CODE (insn) >= 0)
 766     {
 767       if (REG_NOTE_KIND (link) == REG_DEP_ANTI)
 768         cost = 0;
 769       else if (REG_NOTE_KIND (link) == REG_DEP_OUTPUT)
 770         {
 771           cost = (insn_default_latency (insn)
 772                   - insn_default_latency (used));
 773           if (cost <= 0)
 774             cost = 1;
 775         }
 776       else if (bypass_p (insn))
 777         cost = insn_latency (insn, used);
 778     }
 779
 780   /* Give the target a chance to adjust the cost for this dependence.  */
 781   if (targetm.sched.adjust_cost)
 782     cost = (*targetm.sched.adjust_cost) (used, link, insn, cost);
 783
 784   if (cost < 0)
 785     cost = 0;
 786   return cost;
 787 }
 788
 789 /* Compute the priority number for INSN.  */
 790
 791 static int
 792 priority (insn)
 793      rtx insn;
 794 {
 795   rtx link;
 796
 797   if (! INSN_P (insn))
 798     return 0;
 799
 800   if (! INSN_PRIORITY_KNOWN (insn))
 801     {
 802       int this_priority = 0;
 803
 804       if (INSN_DEPEND (insn) == 0)
 805         this_priority = insn_cost (insn, 0, 0);
 806       else
 807         {
 808           for (link = INSN_DEPEND (insn); link; link = XEXP (link, 1))
 809             {
 810               rtx next;
 811               int next_priority;
 812
 813               if (RTX_INTEGRATED_P (link))
 814                 continue;
 815
 816               next = XEXP (link, 0);
 817
 818               /* Critical path is meaningful in block boundaries only.  */
 819               if (! (*current_sched_info->contributes_to_priority) (next, insn))
 820                 continue;
 821
 822               next_priority = insn_cost (insn, link, next) + priority (next);
 823               if (next_priority > this_priority)
 824                 this_priority = next_priority;
 825             }
 826         }
 827       INSN_PRIORITY (insn) = this_priority;
 828       INSN_PRIORITY_KNOWN (insn) = 1;
 829     }
 830
 831   return INSN_PRIORITY (insn);
 832 }
 833 \f
 834 /* Macros and functions for keeping the priority queue sorted, and
 835    dealing with queueing and dequeueing of instructions.  */
 836
 837 #define SCHED_SORT(READY, N_READY)                                   \
 838 do { if ((N_READY) == 2)                                             \
 839        swap_sort (READY, N_READY);                                   \
 840      else if ((N_READY) > 2)                                         \
 841          qsort (READY, N_READY, sizeof (rtx), rank_for_schedule); }  \
 842 while (0)
 843
 844 /* Returns a positive value if x is preferred; returns a negative value if
 845    y is preferred.  Should never return 0, since that will make the sort
 846    unstable.  */
 847
 848 static int
 849 rank_for_schedule (x, y)
 850      const PTR x;
 851      const PTR y;
 852 {
 853   rtx tmp = *(const rtx *) y;
 854   rtx tmp2 = *(const rtx *) x;
 855   rtx link, lsi;
 856   int tmp_class, tmp2_class, depend_count1, depend_count2;
 857   int val, priority_val, weight_val, info_val;
 858
 859   /* Prefer insn with higher priority.  */
 860   priority_val = INSN_PRIORITY (tmp2) - INSN_PRIORITY (tmp);
 861   if (priority_val)
 862     return priority_val;
 863
 864   /* Prefer an insn with smaller contribution to registers-pressure.  */
 865   if (!reload_completed &&
 866       (weight_val = INSN_REG_WEIGHT (tmp) - INSN_REG_WEIGHT (tmp2)))
 867     return (weight_val);
 868
 869   info_val = (*current_sched_info->rank) (tmp, tmp2);
 870   if (info_val)
 871     return info_val;
 872
 873   /* Compare insns based on their relation to the last-scheduled-insn.  */
 874   for (lsi = last_scheduled_insn;
 875        lsi && INSN_UID (lsi) >= old_max_uid;
 876        lsi = PREV_INSN (lsi))
 877     continue;
 878
 879   if (lsi)
 880     {
 881       /* Classify the instructions into three classes:
 882          1) Data dependent on last schedule insn.
 883          2) Anti/Output dependent on last scheduled insn.
 884          3) Independent of last scheduled insn, or has latency of one.
 885          Choose the insn from the highest numbered class if different.  */
 886       link = find_insn_list (tmp, INSN_DEPEND (lsi));
 887       if (link == 0 || insn_cost (lsi, link, tmp) == 1)
 888         tmp_class = 3;
 889       else if (REG_NOTE_KIND (link) == 0)       /* Data dependence.  */
 890         tmp_class = 1;
 891       else
 892         tmp_class = 2;
 893
 894       link = find_insn_list (tmp2, INSN_DEPEND (lsi));
 895       if (link == 0 || insn_cost (lsi, link, tmp2) == 1)
 896         tmp2_class = 3;
 897       else if (REG_NOTE_KIND (link) == 0)       /* Data dependence.  */
 898         tmp2_class = 1;
 899       else
 900         tmp2_class = 2;
 901
 902       if ((val = tmp2_class - tmp_class))
 903         return val;
 904     }
 905
 906   /* Prefer the insn which has more later insns that depend on it.
 907      This gives the scheduler more freedom when scheduling later
 908      instructions at the expense of added register pressure.  */
 909   depend_count1 = 0;
 910   for (link = INSN_DEPEND (tmp); link; link = XEXP (link, 1))
 911     depend_count1++;
 912
 913   depend_count2 = 0;
 914   for (link = INSN_DEPEND (tmp2); link; link = XEXP (link, 1))
 915     depend_count2++;
 916
 917   val = depend_count2 - depend_count1;
 918   if (val)
 919     return val;
 920
 921   /* If insns are equally good, sort by INSN_LUID (original insn order),
 922      so that we make the sort stable.  This minimizes instruction movement,
 923      thus minimizing sched's effect on debugging and cross-jumping.  */
 924   return INSN_LUID (tmp) - INSN_LUID (tmp2);
 925 }
 926
 927 /* Resort the array A in which only element at index N may be out of order.  */
 928
 929 HAIFA_INLINE static void
 930 swap_sort (a, n)
 931      rtx *a;
 932      int n;
 933 {
 934   rtx insn = a[n - 1];
 935   int i = n - 2;
 936
 937   while (i >= 0 && rank_for_schedule (a + i, &insn) >= 0)
 938     {
 939       a[i + 1] = a[i];
 940       i -= 1;
 941     }
 942   a[i + 1] = insn;
 943 }
 944
 945 /* Add INSN to the insn queue so that it can be executed at least
 946    N_CYCLES after the currently executing insn.  Preserve insns
 947    chain for debugging purposes.  */
 948
 949 HAIFA_INLINE static void
 950 queue_insn (insn, n_cycles)
 951      rtx insn;
 952      int n_cycles;
 953 {
 954   int next_q = NEXT_Q_AFTER (q_ptr, n_cycles);
 955   rtx link = alloc_INSN_LIST (insn, insn_queue[next_q]);
 956   insn_queue[next_q] = link;
 957   q_size += 1;
 958
 959   if (sched_verbose >= 2)
 960     {
 961       fprintf (sched_dump, ";;\t\tReady-->Q: insn %s: ",
 962                (*current_sched_info->print_insn) (insn, 0));
 963
 964       fprintf (sched_dump, "queued for %d cycles.\n", n_cycles);
 965     }
 966 }
 967
 968 /* Return a pointer to the bottom of the ready list, i.e. the insn
 969    with the lowest priority.  */
 970
 971 HAIFA_INLINE static rtx *
 972 ready_lastpos (ready)
 973      struct ready_list *ready;
 974 {
 975   if (ready->n_ready == 0)
 976     abort ();
 977   return ready->vec + ready->first - ready->n_ready + 1;
 978 }
 979
 980 /* Add an element INSN to the ready list so that it ends up with the lowest
 981    priority.  */
 982
 983 HAIFA_INLINE void
 984 ready_add (ready, insn)
 985      struct ready_list *ready;
 986      rtx insn;
 987 {
 988   if (ready->first == ready->n_ready)
 989     {
 990       memmove (ready->vec + ready->veclen - ready->n_ready,
 991                ready_lastpos (ready),
 992                ready->n_ready * sizeof (rtx));
 993       ready->first = ready->veclen - 1;
 994     }
 995   ready->vec[ready->first - ready->n_ready] = insn;
 996   ready->n_ready++;
 997 }
 998
 999 /* Remove the element with the highest priority from the ready list and
1000    return it.  */
1001
1002 HAIFA_INLINE static rtx
1003 ready_remove_first (ready)
1004      struct ready_list *ready;
1005 {
1006   rtx t;
1007   if (ready->n_ready == 0)
1008     abort ();
1009   t = ready->vec[ready->first--];
1010   ready->n_ready--;
1011   /* If the queue becomes empty, reset it.  */
1012   if (ready->n_ready == 0)
1013     ready->first = ready->veclen - 1;
1014   return t;
1015 }
1016
/* The following code implements multi-pass scheduling for the first
   cycle.  In other words, we try to choose the ready insn that allows
   the maximum number of insns to start on the same cycle.  */
1020
1021 /* Return a pointer to the element INDEX from the ready.  INDEX for
1022    insn with the highest priority is 0, and the lowest priority has
1023    N_READY - 1.  */
1024
1025 HAIFA_INLINE static rtx
1026 ready_element (ready, index)
1027      struct ready_list *ready;
1028      int index;
1029 {
1030   if (ready->n_ready == 0 || index >= ready->n_ready)
1031     abort ();
1032   return ready->vec[ready->first - index];
1033 }
1034
1035 /* Remove the element INDEX from the ready list and return it.  INDEX
1036    for insn with the highest priority is 0, and the lowest priority
1037    has N_READY - 1.  */
1038
1039 HAIFA_INLINE static rtx
1040 ready_remove (ready, index)
1041      struct ready_list *ready;
1042      int index;
1043 {
1044   rtx t;
1045   int i;
1046
1047   if (index == 0)
1048     return ready_remove_first (ready);
1049   if (ready->n_ready == 0 || index >= ready->n_ready)
1050     abort ();
1051   t = ready->vec[ready->first - index];
1052   ready->n_ready--;
1053   for (i = index; i < ready->n_ready; i++)
1054     ready->vec[ready->first - i] = ready->vec[ready->first - i - 1];
1055   return t;
1056 }
1057
1058
1059 /* Sort the ready list READY by ascending priority, using the SCHED_SORT
1060    macro.  */
1061
1062 HAIFA_INLINE static void
1063 ready_sort (ready)
1064      struct ready_list *ready;
1065 {
1066   rtx *first = ready_lastpos (ready);
1067   SCHED_SORT (first, ready->n_ready);
1068 }
1069
1070 /* PREV is an insn that is ready to execute.  Adjust its priority if that
1071    will help shorten or lengthen register lifetimes as appropriate.  Also
1072    provide a hook for the target to tweek itself.  */
1073
1074 HAIFA_INLINE static void
1075 adjust_priority (prev)
1076      rtx prev;
1077 {
1078   /* ??? There used to be code here to try and estimate how an insn
1079      affected register lifetimes, but it did it by looking at REG_DEAD
1080      notes, which we removed in schedule_region.  Nor did it try to
1081      take into account register pressure or anything useful like that.
1082
1083      Revisit when we have a machine model to work with and not before.  */
1084
1085   if (targetm.sched.adjust_priority)
1086     INSN_PRIORITY (prev) =
1087       (*targetm.sched.adjust_priority) (prev, INSN_PRIORITY (prev));
1088 }
1089
1090 /* Advance time on one cycle.  */
1091 HAIFA_INLINE static void
1092 advance_one_cycle ()
1093 {
1094   if (targetm.sched.use_dfa_pipeline_interface
1095       && (*targetm.sched.use_dfa_pipeline_interface) ())
1096     {
1097       if (targetm.sched.dfa_pre_cycle_insn)
1098         state_transition (curr_state,
1099                           (*targetm.sched.dfa_pre_cycle_insn) ());
1100
1101       state_transition (curr_state, NULL);
1102
1103       if (targetm.sched.dfa_post_cycle_insn)
1104         state_transition (curr_state,
1105                           (*targetm.sched.dfa_post_cycle_insn) ());
1106     }
1107 }
1108
1109 /* Clock at which the previous instruction was issued.  */
1110 static int last_clock_var;
1111
1112 /* INSN is the "currently executing insn".  Launch each insn which was
1113    waiting on INSN.  READY is the ready list which contains the insns
1114    that are ready to fire.  CLOCK is the current cycle.
1115    */
1116
1117 static void
1118 schedule_insn (insn, ready, clock)
1119      rtx insn;
1120      struct ready_list *ready;
1121      int clock;
1122 {
1123   rtx link;
1124   int unit = 0;
1125
1126   if (!targetm.sched.use_dfa_pipeline_interface
1127       || !(*targetm.sched.use_dfa_pipeline_interface) ())
1128     unit = insn_unit (insn);
1129
1130   if (targetm.sched.use_dfa_pipeline_interface
1131       && (*targetm.sched.use_dfa_pipeline_interface) ()
1132       && sched_verbose >= 1)
1133     {
1134       char buf[2048];
1135
1136       print_insn (buf, insn, 0);
1137       buf[40]=0;
1138       fprintf (sched_dump, ";;\t%3i--> %-40s:", clock, buf);
1139
1140       if (recog_memoized (insn) < 0)
1141         fprintf (sched_dump, "nothing");
1142       else
1143         print_reservation (sched_dump, insn);
1144       fputc ('\n', sched_dump);
1145     }
1146   else if (sched_verbose >= 2)
1147     {
1148       fprintf (sched_dump, ";;\t\t--> scheduling insn <<<%d>>> on unit ",
1149                INSN_UID (insn));
1150       insn_print_units (insn);
1151       fputc ('\n', sched_dump);
1152     }
1153
1154   if (!targetm.sched.use_dfa_pipeline_interface
1155       || !(*targetm.sched.use_dfa_pipeline_interface) ())
1156     {
1157       if (sched_verbose && unit == -1)
1158         visualize_no_unit (insn);
1159
1160
1161       if (MAX_BLOCKAGE > 1 || issue_rate > 1 || sched_verbose)
1162         schedule_unit (unit, insn, clock);
1163
1164       if (INSN_DEPEND (insn) == 0)
1165         return;
1166     }
1167
1168   for (link = INSN_DEPEND (insn); link != 0; link = XEXP (link, 1))
1169     {
1170       rtx next = XEXP (link, 0);
1171       int cost = insn_cost (insn, link, next);
1172
1173       INSN_TICK (next) = MAX (INSN_TICK (next), clock + cost);
1174
1175       if ((INSN_DEP_COUNT (next) -= 1) == 0)
1176         {
1177           int effective_cost = INSN_TICK (next) - clock;
1178
1179           if (! (*current_sched_info->new_ready) (next))
1180             continue;
1181
1182           if (sched_verbose >= 2)
1183             {
1184               fprintf (sched_dump, ";;\t\tdependences resolved: insn %s ",
1185                        (*current_sched_info->print_insn) (next, 0));
1186
1187               if (effective_cost < 1)
1188                 fprintf (sched_dump, "into ready\n");
1189               else
1190                 fprintf (sched_dump, "into queue with cost=%d\n", effective_cost);
1191             }
1192
1193           /* Adjust the priority of NEXT and either put it on the ready
1194              list or queue it.  */
1195           adjust_priority (next);
1196           if (effective_cost < 1)
1197             ready_add (ready, next);
1198           else
1199             queue_insn (next, effective_cost);
1200         }
1201     }
1202
1203   /* Annotate the instruction with issue information -- TImode
1204      indicates that the instruction is expected not to be able
1205      to issue on the same cycle as the previous insn.  A machine
1206      may use this information to decide how the instruction should
1207      be aligned.  */
1208   if (reload_completed && issue_rate > 1
1209       && GET_CODE (PATTERN (insn)) != USE
1210       && GET_CODE (PATTERN (insn)) != CLOBBER)
1211     {
1212       PUT_MODE (insn, clock > last_clock_var ? TImode : VOIDmode);
1213       last_clock_var = clock;
1214     }
1215 }
1216
1217 /* Functions for handling of notes.  */
1218
1219 /* Delete notes beginning with INSN and put them in the chain
1220    of notes ended by NOTE_LIST.
1221    Returns the insn following the notes.  */
1222
1223 static rtx
1224 unlink_other_notes (insn, tail)
1225      rtx insn, tail;
1226 {
1227   rtx prev = PREV_INSN (insn);
1228
1229   while (insn != tail && GET_CODE (insn) == NOTE)
1230     {
1231       rtx next = NEXT_INSN (insn);
1232       /* Delete the note from its current position.  */
1233       if (prev)
1234         NEXT_INSN (prev) = next;
1235       if (next)
1236         PREV_INSN (next) = prev;
1237
1238       /* See sched_analyze to see how these are handled.  */
1239       if (NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG
1240           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_END
1241           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_RANGE_BEG
1242           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_RANGE_END
1243           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_EH_REGION_BEG
1244           && NOTE_LINE_NUMBER (insn) != NOTE_INSN_EH_REGION_END)
1245         {
1246           /* Insert the note at the end of the notes list.  */
1247           PREV_INSN (insn) = note_list;
1248           if (note_list)
1249             NEXT_INSN (note_list) = insn;
1250           note_list = insn;
1251         }
1252
1253       insn = next;
1254     }
1255   return insn;
1256 }
1257
1258 /* Delete line notes beginning with INSN. Record line-number notes so
1259    they can be reused.  Returns the insn following the notes.  */
1260
1261 static rtx
1262 unlink_line_notes (insn, tail)
1263      rtx insn, tail;
1264 {
1265   rtx prev = PREV_INSN (insn);
1266
1267   while (insn != tail && GET_CODE (insn) == NOTE)
1268     {
1269       rtx next = NEXT_INSN (insn);
1270
1271       if (write_symbols != NO_DEBUG && NOTE_LINE_NUMBER (insn) > 0)
1272         {
1273           /* Delete the note from its current position.  */
1274           if (prev)
1275             NEXT_INSN (prev) = next;
1276           if (next)
1277             PREV_INSN (next) = prev;
1278
1279           /* Record line-number notes so they can be reused.  */
1280           LINE_NOTE (insn) = insn;
1281         }
1282       else
1283         prev = insn;
1284
1285       insn = next;
1286     }
1287   return insn;
1288 }
1289
1290 /* Return the head and tail pointers of BB.  */
1291
1292 void
1293 get_block_head_tail (b, headp, tailp)
1294      int b;
1295      rtx *headp;
1296      rtx *tailp;
1297 {
1298   /* HEAD and TAIL delimit the basic block being scheduled.  */
1299   rtx head = BLOCK_HEAD (b);
1300   rtx tail = BLOCK_END (b);
1301
1302   /* Don't include any notes or labels at the beginning of the
1303      basic block, or notes at the ends of basic blocks.  */
1304   while (head != tail)
1305     {
1306       if (GET_CODE (head) == NOTE)
1307         head = NEXT_INSN (head);
1308       else if (GET_CODE (tail) == NOTE)
1309         tail = PREV_INSN (tail);
1310       else if (GET_CODE (head) == CODE_LABEL)
1311         head = NEXT_INSN (head);
1312       else
1313         break;
1314     }
1315
1316   *headp = head;
1317   *tailp = tail;
1318 }
1319
1320 /* Return nonzero if there are no real insns in the range [ HEAD, TAIL ].  */
1321
1322 int
1323 no_real_insns_p (head, tail)
1324      rtx head, tail;
1325 {
1326   while (head != NEXT_INSN (tail))
1327     {
1328       if (GET_CODE (head) != NOTE && GET_CODE (head) != CODE_LABEL)
1329         return 0;
1330       head = NEXT_INSN (head);
1331     }
1332   return 1;
1333 }
1334
1335 /* Delete line notes from one block. Save them so they can be later restored
1336    (in restore_line_notes).  HEAD and TAIL are the boundaries of the
1337    block in which notes should be processed.  */
1338
1339 void
1340 rm_line_notes (head, tail)
1341      rtx head, tail;
1342 {
1343   rtx next_tail;
1344   rtx insn;
1345
1346   next_tail = NEXT_INSN (tail);
1347   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1348     {
1349       rtx prev;
1350
1351       /* Farm out notes, and maybe save them in NOTE_LIST.
1352          This is needed to keep the debugger from
1353          getting completely deranged.  */
1354       if (GET_CODE (insn) == NOTE)
1355         {
1356           prev = insn;
1357           insn = unlink_line_notes (insn, next_tail);
1358
1359           if (prev == tail)
1360             abort ();
1361           if (prev == head)
1362             abort ();
1363           if (insn == next_tail)
1364             abort ();
1365         }
1366     }
1367 }
1368
1369 /* Save line number notes for each insn in block B.  HEAD and TAIL are
1370    the boundaries of the block in which notes should be processed.  */
1371
1372 void
1373 save_line_notes (b, head, tail)
1374      int b;
1375      rtx head, tail;
1376 {
1377   rtx next_tail;
1378
1379   /* We must use the true line number for the first insn in the block
1380      that was computed and saved at the start of this pass.  We can't
1381      use the current line number, because scheduling of the previous
1382      block may have changed the current line number.  */
1383
1384   rtx line = line_note_head[b];
1385   rtx insn;
1386
1387   next_tail = NEXT_INSN (tail);
1388
1389   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1390     if (GET_CODE (insn) == NOTE && NOTE_LINE_NUMBER (insn) > 0)
1391       line = insn;
1392     else
1393       LINE_NOTE (insn) = line;
1394 }
1395
1396 /* After a block was scheduled, insert line notes into the insns list.
1397    HEAD and TAIL are the boundaries of the block in which notes should
1398    be processed.  */
1399
1400 void
1401 restore_line_notes (head, tail)
1402      rtx head, tail;
1403 {
1404   rtx line, note, prev, new;
1405   int added_notes = 0;
1406   rtx next_tail, insn;
1407
1408   head = head;
1409   next_tail = NEXT_INSN (tail);
1410
1411   /* Determine the current line-number.  We want to know the current
1412      line number of the first insn of the block here, in case it is
1413      different from the true line number that was saved earlier.  If
1414      different, then we need a line number note before the first insn
1415      of this block.  If it happens to be the same, then we don't want to
1416      emit another line number note here.  */
1417   for (line = head; line; line = PREV_INSN (line))
1418     if (GET_CODE (line) == NOTE && NOTE_LINE_NUMBER (line) > 0)
1419       break;
1420
1421   /* Walk the insns keeping track of the current line-number and inserting
1422      the line-number notes as needed.  */
1423   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1424     if (GET_CODE (insn) == NOTE && NOTE_LINE_NUMBER (insn) > 0)
1425       line = insn;
1426   /* This used to emit line number notes before every non-deleted note.
1427      However, this confuses a debugger, because line notes not separated
1428      by real instructions all end up at the same address.  I can find no
1429      use for line number notes before other notes, so none are emitted.  */
1430     else if (GET_CODE (insn) != NOTE
1431              && INSN_UID (insn) < old_max_uid
1432              && (note = LINE_NOTE (insn)) != 0
1433              && note != line
1434              && (line == 0
1435                  || NOTE_LINE_NUMBER (note) != NOTE_LINE_NUMBER (line)
1436                  || NOTE_SOURCE_FILE (note) != NOTE_SOURCE_FILE (line)))
1437       {
1438         line = note;
1439         prev = PREV_INSN (insn);
1440         if (LINE_NOTE (note))
1441           {
1442             /* Re-use the original line-number note.  */
1443             LINE_NOTE (note) = 0;
1444             PREV_INSN (note) = prev;
1445             NEXT_INSN (prev) = note;
1446             PREV_INSN (insn) = note;
1447             NEXT_INSN (note) = insn;
1448           }
1449         else
1450           {
1451             added_notes++;
1452             new = emit_note_after (NOTE_LINE_NUMBER (note), prev);
1453             NOTE_SOURCE_FILE (new) = NOTE_SOURCE_FILE (note);
1454             RTX_INTEGRATED_P (new) = RTX_INTEGRATED_P (note);
1455           }
1456       }
1457   if (sched_verbose && added_notes)
1458     fprintf (sched_dump, ";; added %d line-number notes\n", added_notes);
1459 }
1460
1461 /* After scheduling the function, delete redundant line notes from the
1462    insns list.  */
1463
1464 void
1465 rm_redundant_line_notes ()
1466 {
1467   rtx line = 0;
1468   rtx insn = get_insns ();
1469   int active_insn = 0;
1470   int notes = 0;
1471
1472   /* Walk the insns deleting redundant line-number notes.  Many of these
1473      are already present.  The remainder tend to occur at basic
1474      block boundaries.  */
1475   for (insn = get_last_insn (); insn; insn = PREV_INSN (insn))
1476     if (GET_CODE (insn) == NOTE && NOTE_LINE_NUMBER (insn) > 0)
1477       {
1478         /* If there are no active insns following, INSN is redundant.  */
1479         if (active_insn == 0)
1480           {
1481             notes++;
1482             NOTE_SOURCE_FILE (insn) = 0;
1483             NOTE_LINE_NUMBER (insn) = NOTE_INSN_DELETED;
1484           }
1485         /* If the line number is unchanged, LINE is redundant.  */
1486         else if (line
1487                  && NOTE_LINE_NUMBER (line) == NOTE_LINE_NUMBER (insn)
1488                  && NOTE_SOURCE_FILE (line) == NOTE_SOURCE_FILE (insn))
1489           {
1490             notes++;
1491             NOTE_SOURCE_FILE (line) = 0;
1492             NOTE_LINE_NUMBER (line) = NOTE_INSN_DELETED;
1493             line = insn;
1494           }
1495         else
1496           line = insn;
1497         active_insn = 0;
1498       }
1499     else if (!((GET_CODE (insn) == NOTE
1500                 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_DELETED)
1501                || (GET_CODE (insn) == INSN
1502                    && (GET_CODE (PATTERN (insn)) == USE
1503                        || GET_CODE (PATTERN (insn)) == CLOBBER))))
1504       active_insn++;
1505
1506   if (sched_verbose && notes)
1507     fprintf (sched_dump, ";; deleted %d line-number notes\n", notes);
1508 }
1509
1510 /* Delete notes between HEAD and TAIL and put them in the chain
1511    of notes ended by NOTE_LIST.  */
1512
1513 void
1514 rm_other_notes (head, tail)
1515      rtx head;
1516      rtx tail;
1517 {
1518   rtx next_tail;
1519   rtx insn;
1520
1521   note_list = 0;
1522   if (head == tail && (! INSN_P (head)))
1523     return;
1524
1525   next_tail = NEXT_INSN (tail);
1526   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1527     {
1528       rtx prev;
1529
1530       /* Farm out notes, and maybe save them in NOTE_LIST.
1531          This is needed to keep the debugger from
1532          getting completely deranged.  */
1533       if (GET_CODE (insn) == NOTE)
1534         {
1535           prev = insn;
1536
1537           insn = unlink_other_notes (insn, next_tail);
1538
1539           if (prev == tail)
1540             abort ();
1541           if (prev == head)
1542             abort ();
1543           if (insn == next_tail)
1544             abort ();
1545         }
1546     }
1547 }
1548
1549 /* Functions for computation of registers live/usage info.  */
1550
1551 /* Calculate INSN_REG_WEIGHT for all insns of a block.  */
1552
1553 static void
1554 find_insn_reg_weight (b)
1555      int b;
1556 {
1557   rtx insn, next_tail, head, tail;
1558
1559   get_block_head_tail (b, &head, &tail);
1560   next_tail = NEXT_INSN (tail);
1561
1562   for (insn = head; insn != next_tail; insn = NEXT_INSN (insn))
1563     {
1564       int reg_weight = 0;
1565       rtx x;
1566
1567       /* Handle register life information.  */
1568       if (! INSN_P (insn))
1569         continue;
1570
1571       /* Increment weight for each register born here.  */
1572       x = PATTERN (insn);
1573       if ((GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
1574           && register_operand (SET_DEST (x), VOIDmode))
1575         reg_weight++;
1576       else if (GET_CODE (x) == PARALLEL)
1577         {
1578           int j;
1579           for (j = XVECLEN (x, 0) - 1; j >= 0; j--)
1580             {
1581               x = XVECEXP (PATTERN (insn), 0, j);
1582               if ((GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
1583                   && register_operand (SET_DEST (x), VOIDmode))
1584                 reg_weight++;
1585             }
1586         }
1587
1588       /* Decrement weight for each register that dies here.  */
1589       for (x = REG_NOTES (insn); x; x = XEXP (x, 1))
1590         {
1591           if (REG_NOTE_KIND (x) == REG_DEAD
1592               || REG_NOTE_KIND (x) == REG_UNUSED)
1593             reg_weight--;
1594         }
1595
1596       INSN_REG_WEIGHT (insn) = reg_weight;
1597     }
1598 }
1599
1600 /* Scheduling clock, modified in schedule_block() and queue_to_ready ().  */
1601 static int clock_var;
1602
1603 /* Move insns that became ready to fire from queue to ready list.  */
1604
1605 static void
1606 queue_to_ready (ready)
1607      struct ready_list *ready;
1608 {
1609   rtx insn;
1610   rtx link;
1611
1612   q_ptr = NEXT_Q (q_ptr);
1613
1614   /* Add all pending insns that can be scheduled without stalls to the
1615      ready list.  */
1616   for (link = insn_queue[q_ptr]; link; link = XEXP (link, 1))
1617     {
1618       insn = XEXP (link, 0);
1619       q_size -= 1;
1620
1621       if (sched_verbose >= 2)
1622         fprintf (sched_dump, ";;\t\tQ-->Ready: insn %s: ",
1623                  (*current_sched_info->print_insn) (insn, 0));
1624
1625       ready_add (ready, insn);
1626       if (sched_verbose >= 2)
1627         fprintf (sched_dump, "moving to ready without stalls\n");
1628     }
1629   insn_queue[q_ptr] = 0;
1630
1631   /* If there are no ready insns, stall until one is ready and add all
1632      of the pending insns at that point to the ready list.  */
1633   if (ready->n_ready == 0)
1634     {
1635       int stalls;
1636
1637       for (stalls = 1; stalls <= MAX_INSN_QUEUE_INDEX; stalls++)
1638         {
1639           if ((link = insn_queue[NEXT_Q_AFTER (q_ptr, stalls)]))
1640             {
1641               for (; link; link = XEXP (link, 1))
1642                 {
1643                   insn = XEXP (link, 0);
1644                   q_size -= 1;
1645
1646                   if (sched_verbose >= 2)
1647                     fprintf (sched_dump, ";;\t\tQ-->Ready: insn %s: ",
1648                              (*current_sched_info->print_insn) (insn, 0));
1649
1650                   ready_add (ready, insn);
1651                   if (sched_verbose >= 2)
1652                     fprintf (sched_dump, "moving to ready with %d stalls\n", stalls);
1653                 }
1654               insn_queue[NEXT_Q_AFTER (q_ptr, stalls)] = 0;
1655
1656               advance_one_cycle ();
1657
1658               break;
1659             }
1660
1661           advance_one_cycle ();
1662         }
1663
1664       if ((!targetm.sched.use_dfa_pipeline_interface
1665            || !(*targetm.sched.use_dfa_pipeline_interface) ())
1666           && sched_verbose && stalls)
1667         visualize_stall_cycles (stalls);
1668
1669       q_ptr = NEXT_Q_AFTER (q_ptr, stalls);
1670       clock_var += stalls;
1671     }
1672 }
1673
1674 /* Print the ready list for debugging purposes.  Callable from debugger.  */
1675
1676 static void
1677 debug_ready_list (ready)
1678      struct ready_list *ready;
1679 {
1680   rtx *p;
1681   int i;
1682
1683   if (ready->n_ready == 0)
1684     {
1685       fprintf (sched_dump, "\n");
1686       return;
1687     }
1688
1689   p = ready_lastpos (ready);
1690   for (i = 0; i < ready->n_ready; i++)
1691     fprintf (sched_dump, "  %s", (*current_sched_info->print_insn) (p[i], 0));
1692   fprintf (sched_dump, "\n");
1693 }
1694
1695 /* move_insn1: Remove INSN from insn chain, and link it after LAST insn.  */
1696
1697 static rtx
1698 move_insn1 (insn, last)
1699      rtx insn, last;
1700 {
1701   NEXT_INSN (PREV_INSN (insn)) = NEXT_INSN (insn);
1702   PREV_INSN (NEXT_INSN (insn)) = PREV_INSN (insn);
1703
1704   NEXT_INSN (insn) = NEXT_INSN (last);
1705   PREV_INSN (NEXT_INSN (last)) = insn;
1706
1707   NEXT_INSN (last) = insn;
1708   PREV_INSN (insn) = last;
1709
1710   return insn;
1711 }
1712
1713 /* Search INSN for REG_SAVE_NOTE note pairs for
1714    NOTE_INSN_{LOOP,EHREGION}_{BEG,END}; and convert them back into
1715    NOTEs.  The REG_SAVE_NOTE note following first one is contains the
1716    saved value for NOTE_BLOCK_NUMBER which is useful for
1717    NOTE_INSN_EH_REGION_{BEG,END} NOTEs.  LAST is the last instruction
1718    output by the instruction scheduler.  Return the new value of LAST.  */
1719
1720 static rtx
1721 reemit_notes (insn, last)
1722      rtx insn;
1723      rtx last;
1724 {
1725   rtx note, retval;
1726
1727   retval = last;
1728   for (note = REG_NOTES (insn); note; note = XEXP (note, 1))
1729     {
1730       if (REG_NOTE_KIND (note) == REG_SAVE_NOTE)
1731         {
1732           enum insn_note note_type = INTVAL (XEXP (note, 0));
1733
1734           if (note_type == NOTE_INSN_RANGE_BEG
1735               || note_type == NOTE_INSN_RANGE_END)
1736             {
1737               last = emit_note_before (note_type, last);
1738               remove_note (insn, note);
1739               note = XEXP (note, 1);
1740               NOTE_RANGE_INFO (last) = XEXP (note, 0);
1741             }
1742           else
1743             {
1744               last = emit_note_before (note_type, last);
1745               remove_note (insn, note);
1746               note = XEXP (note, 1);
1747               if (note_type == NOTE_INSN_EH_REGION_BEG
1748                   || note_type == NOTE_INSN_EH_REGION_END)
1749                 NOTE_EH_HANDLER (last) = INTVAL (XEXP (note, 0));
1750             }
1751           remove_note (insn, note);
1752         }
1753     }
1754   return retval;
1755 }
1756
1757 /* Move INSN, and all insns which should be issued before it,
1758    due to SCHED_GROUP_P flag.  Reemit notes if needed.
1759
1760    Return the last insn emitted by the scheduler, which is the
1761    return value from the first call to reemit_notes.  */
1762
1763 static rtx
1764 move_insn (insn, last)
1765      rtx insn, last;
1766 {
1767   rtx retval = NULL;
1768
1769   /* If INSN has SCHED_GROUP_P set, then issue it and any other
1770      insns with SCHED_GROUP_P set first.  */
1771   while (SCHED_GROUP_P (insn))
1772     {
1773       rtx prev = PREV_INSN (insn);
1774
1775       /* Move a SCHED_GROUP_P insn.  */
1776       move_insn1 (insn, last);
1777       /* If this is the first call to reemit_notes, then record
1778          its return value.  */
1779       if (retval == NULL_RTX)
1780         retval = reemit_notes (insn, insn);
1781       else
1782         reemit_notes (insn, insn);
1783       insn = prev;
1784     }
1785
1786   /* Now move the first non SCHED_GROUP_P insn.  */
1787   move_insn1 (insn, last);
1788
1789   /* If this is the first call to reemit_notes, then record
1790      its return value.  */
1791   if (retval == NULL_RTX)
1792     retval = reemit_notes (insn, insn);
1793   else
1794     reemit_notes (insn, insn);
1795
1796   return retval;
1797 }
1798
1799 /* The following function returns maximal (or close to maximal) number
1800    of insns which can be issued on the same cycle and one of which
1801    insns is insns with the best rank (the last insn in READY).  To
1802    make this function tries different samples of ready insns.  READY
1803    is current queue `ready'.  Global array READY_TRY reflects what
1804    insns are already issued in this try.  STATE is current processor
1805    state.  If the function returns nonzero, INDEX will contain index
1806    of the best insn in READY.  The following function is used only for
1807    first cycle multipass scheduling.  */
1808
1809 static int
1810 max_issue (ready, state, index)
1811      struct ready_list *ready;
1812      state_t state;
1813      int *index;
1814 {
1815   int i, best, n, temp_index, delay;
1816   state_t temp_state;
1817   rtx insn;
1818   int max_lookahead = (*targetm.sched.first_cycle_multipass_dfa_lookahead) ();
1819
1820   if (state_dead_lock_p (state))
1821     return 0;
1822
1823   temp_state = alloca (dfa_state_size);
1824   best = 0;
1825
1826   for (i = 0; i < ready->n_ready; i++)
1827     if (!ready_try [i])
1828       {
1829         insn = ready_element (ready, i);
1830
1831         if (INSN_CODE (insn) < 0)
1832           continue;
1833
1834         memcpy (temp_state, state, dfa_state_size);
1835
1836         delay = state_transition (temp_state, insn);
1837
1838         if (delay == 0)
1839           {
1840             if (!targetm.sched.dfa_bubble)
1841               continue;
1842             else
1843               {
1844                 int j;
1845                 rtx bubble;
1846
1847                 for (j = 0;
1848                      (bubble = (*targetm.sched.dfa_bubble) (j)) != NULL_RTX;
1849                      j++)
1850                   if (state_transition (temp_state, bubble) < 0
1851                       && state_transition (temp_state, insn) < 0)
1852                     break;
1853
1854                 if (bubble == NULL_RTX)
1855                   continue;
1856               }
1857           }
1858         else if (delay > 0)
1859           continue;
1860
1861         --max_lookahead;
1862
1863         if (max_lookahead < 0)
1864           break;
1865
1866         ready_try [i] = 1;
1867
1868         n = max_issue (ready, temp_state, &temp_index);
1869         if (n > 0 || ready_try[0])
1870           n += 1;
1871
1872         if (best < n)
1873           {
1874             best = n;
1875             *index = i;
1876           }
1877         ready_try [i] = 0;
1878       }
1879
1880   return best;
1881 }
1882
1883 /* The following function chooses insn from READY and modifies
1884    *N_READY and READY.  The following function is used only for first
1885    cycle multipass scheduling.  */
1886
1887 static rtx
1888 choose_ready (ready)
1889      struct ready_list *ready;
1890 {
1891   if (!targetm.sched.first_cycle_multipass_dfa_lookahead
1892       || (*targetm.sched.first_cycle_multipass_dfa_lookahead) () <= 0)
1893     return ready_remove_first (ready);
1894   else
1895     {
1896       /* Try to choose the better insn.  */
1897       int index;
1898
1899       if (max_issue (ready, curr_state, &index) == 0)
1900         return ready_remove_first (ready);
1901       else
1902         return ready_remove (ready, index);
1903     }
1904 }
1905
1906 /* Called from backends from targetm.sched.reorder to emit stuff into
1907    the instruction stream.  */
1908
1909 rtx
1910 sched_emit_insn (pat)
1911      rtx pat;
1912 {
1913   rtx insn = emit_insn_after (pat, last_scheduled_insn);
1914   last_scheduled_insn = insn;
1915   return insn;
1916 }
1917
/* Use forward list scheduling to rearrange the insns of block B,
   possibly bringing insns from subsequent blocks in the same region.

   B is used here only to label the debugging dump.  RGN_N_INSNS is
   used to size the ready list and the READY_TRY array.  The insns to
   schedule lie between current_sched_info->prev_head and
   current_sched_info->next_tail; on return current_sched_info->head
   and current_sched_info->tail are set to the new boundaries.

   The function aborts if the block consists of a single non-insn, if
   no insn is ready after queue_to_ready, or if the queue is not empty
   at the end while current_sched_info->queue_must_finish_empty is
   set.  */

void
schedule_block (b, rgn_n_insns)
     int b;
     int rgn_n_insns;
{
  struct ready_list ready;
  int first_cycle_insn_p;
  int can_issue_more;
  state_t temp_state = NULL;  /* It is used for multipass scheduling.  */

  /* Head/tail info for this block.  */
  rtx prev_head = current_sched_info->prev_head;
  rtx next_tail = current_sched_info->next_tail;
  rtx head = NEXT_INSN (prev_head);
  rtx tail = PREV_INSN (next_tail);

  /* We used to have code to avoid getting parameters moved from hard
     argument registers into pseudos.

     However, it was removed when it proved to be of marginal benefit
     and caused problems because schedule_block and compute_forward_dependences
     had different notions of what the "head" insn was.  */

  if (head == tail && (! INSN_P (head)))
    abort ();

  /* Debug info.  */
  if (sched_verbose)
    {
      fprintf (sched_dump, ";;   ======================================================\n");
      fprintf (sched_dump,
               ";;   -- basic block %d from %d to %d -- %s reload\n",
               b, INSN_UID (head), INSN_UID (tail),
               (reload_completed ? "after" : "before"));
      fprintf (sched_dump, ";;   ======================================================\n");
      fprintf (sched_dump, "\n");

      visualize_alloc ();
      init_block_visualization ();
    }

  /* Reset the pipeline model: the DFA state when the target uses the
     DFA interface, the function units otherwise.  */
  if (targetm.sched.use_dfa_pipeline_interface
      && (*targetm.sched.use_dfa_pipeline_interface) ())
    state_reset (curr_state);
  else
    clear_units ();

  /* Allocate the ready list.  */
  ready.veclen = rgn_n_insns + 1 + issue_rate;
  ready.first = ready.veclen - 1;
  ready.vec = (rtx *) xmalloc (ready.veclen * sizeof (rtx));
  ready.n_ready = 0;

  if (targetm.sched.use_dfa_pipeline_interface
      && (*targetm.sched.use_dfa_pipeline_interface) ())
    {
      /* It is used for first cycle multipass scheduling.  */
      temp_state = alloca (dfa_state_size);
      /* READY_TRY is freed at the end of this function under the same
         condition.  */
      ready_try = (char *) xmalloc ((rgn_n_insns + 1) * sizeof (char));
      memset (ready_try, 0, (rgn_n_insns + 1) * sizeof (char));
    }

  (*current_sched_info->init_ready_list) (&ready);

  if (targetm.sched.md_init)
    (*targetm.sched.md_init) (sched_dump, sched_verbose, ready.veclen);

  /* We start inserting insns after PREV_HEAD.  */
  last_scheduled_insn = prev_head;

  /* Initialize INSN_QUEUE.  Q_SIZE is the total number of insns in the
     queue.  */
  q_ptr = 0;
  q_size = 0;

  /* The largest queue index depends on which pipeline interface is
     in use.  */
  if (!targetm.sched.use_dfa_pipeline_interface
      || !(*targetm.sched.use_dfa_pipeline_interface) ())
    max_insn_queue_index_macro_value = INSN_QUEUE_SIZE - 1;
  else
    max_insn_queue_index_macro_value = max_insn_queue_index;

  insn_queue = (rtx *) alloca ((MAX_INSN_QUEUE_INDEX + 1) * sizeof (rtx));
  memset ((char *) insn_queue, 0, (MAX_INSN_QUEUE_INDEX + 1) * sizeof (rtx));
  last_clock_var = -1;

  /* Start just before the beginning of time.  */
  clock_var = -1;

  /* Loop until all the insns in BB are scheduled.  */
  while ((*current_sched_info->schedule_more_p) ())
    {
      clock_var++;

      advance_one_cycle ();

      /* Add to the ready list all pending insns that can be issued now.
         If there are no ready insns, increment clock until one
         is ready and add all pending insns at that point to the ready
         list.  */
      queue_to_ready (&ready);

      if (sched_verbose && targetm.sched.cycle_display)
        last_scheduled_insn
          = (*targetm.sched.cycle_display) (clock_var, last_scheduled_insn);

      if (ready.n_ready == 0)
        abort ();

      if (sched_verbose >= 2)
        {
          fprintf (sched_dump, ";;\t\tReady list after queue_to_ready:  ");
          debug_ready_list (&ready);
        }

      /* Sort the ready list based on priority.  */
      ready_sort (&ready);

      /* Allow the target to reorder the list, typically for
         better instruction bundling.  */
      if (targetm.sched.reorder)
        can_issue_more =
          (*targetm.sched.reorder) (sched_dump, sched_verbose,
                                    ready_lastpos (&ready),
                                    &ready.n_ready, clock_var);
      else
        can_issue_more = issue_rate;

      /* Issue insns on the current cycle until nothing more can be
         issued.  */
      first_cycle_insn_p = 1;
      for (;;)
        {
          rtx insn;
          int cost;

          if (sched_verbose >= 2)
            {
              fprintf (sched_dump, ";;\tReady list (t =%3d):  ",
                       clock_var);
              debug_ready_list (&ready);
            }

          if (!targetm.sched.use_dfa_pipeline_interface
              || !(*targetm.sched.use_dfa_pipeline_interface) ())
            {
              /* Non-DFA path: the cost comes from actual_hazard.  */
              if (ready.n_ready == 0 || !can_issue_more
                  || !(*current_sched_info->schedule_more_p) ())
                break;
              insn = choose_ready (&ready);
              cost = actual_hazard (insn_unit (insn), insn, clock_var, 0);
            }
          else
            {
              if (ready.n_ready == 0 || !can_issue_more
                  || state_dead_lock_p (curr_state)
                  || !(*current_sched_info->schedule_more_p) ())
                break;

              /* Select and remove the insn from the ready list.  */
              insn = choose_ready (&ready);

              /* Work on a copy of the automaton state; it is copied
                 back to CURR_STATE below only if INSN is issued.  */
              memcpy (temp_state, curr_state, dfa_state_size);
              if (recog_memoized (insn) < 0)
                {
                  if (!first_cycle_insn_p
                      && (GET_CODE (PATTERN (insn)) == ASM_INPUT
                          || asm_noperands (PATTERN (insn)) >= 0))
                    /* This is an asm insn which is being tried on a
                       cycle that is not the first.  Issue it on the
                       next cycle.  */
                    cost = 1;
                  else
                    /* A USE insn, or something else we don't need to
                       understand.  We can't pass these directly to
                       state_transition because it will trigger a
                       fatal error for unrecognizable insns.  */
                    cost = 0;
                }
              else
                {
                  cost = state_transition (temp_state, insn);

                  if (targetm.sched.first_cycle_multipass_dfa_lookahead
                      && targetm.sched.dfa_bubble)
                    {
                      if (cost == 0)
                        {
                          int j;
                          rtx bubble;

                          /* Try each bubble the target offers, each
                             time from a fresh copy of CURR_STATE,
                             until one is found after which INSN can
                             be issued.  */
                          for (j = 0;
                               (bubble = (*targetm.sched.dfa_bubble) (j))
                                 != NULL_RTX;
                               j++)
                            {
                              memcpy (temp_state, curr_state, dfa_state_size);

                              if (state_transition (temp_state, bubble) < 0
                                  && state_transition (temp_state, insn) < 0)
                                break;
                            }

                          if (bubble != NULL_RTX)
                            {
                              if (insert_schedule_bubbles_p)
                                {
                                  rtx copy;

                                  /* Emit a copy of the bubble into the
                                     insn stream after the last
                                     scheduled insn.  */
                                  copy = copy_rtx (PATTERN (bubble));
                                  emit_insn_after (copy, last_scheduled_insn);
                                  last_scheduled_insn
                                    = NEXT_INSN (last_scheduled_insn);
                                  INSN_CODE (last_scheduled_insn)
                                    = INSN_CODE (bubble);

                                  /* Annotate the same for the first insns
                                     scheduling by using mode.  */
                                  PUT_MODE (last_scheduled_insn,
                                            (clock_var > last_clock_var
                                             ? clock_var - last_clock_var
                                             : VOIDmode));
                                  last_clock_var = clock_var;

                                  if (sched_verbose >= 2)
                                    {
                                      fprintf (sched_dump,
                                               ";;\t\t--> scheduling bubble insn <<<%d>>>:reservation ",
                                               INSN_UID (last_scheduled_insn));

                                      if (recog_memoized (last_scheduled_insn)
                                          < 0)
                                        fprintf (sched_dump, "nothing");
                                      else
                                        print_reservation
                                          (sched_dump, last_scheduled_insn);

                                      fprintf (sched_dump, "\n");
                                    }
                                }
                              /* A usable bubble was found, so INSN is
                                 treated as issuable.  */
                              cost = -1;
                            }
                        }
                    }

                  /* Remap the result: a negative value becomes cost 0
                     (issue now), zero becomes cost 1 (requeue), and a
                     positive value is kept as is.  */
                  if (cost < 0)
                    cost = 0;
                  else if (cost == 0)
                    cost = 1;
                }
            }


          /* INSN cannot be issued on this cycle: hand it to
             queue_insn with its cost and try another ready insn.  */
          if (cost >= 1)
            {
              queue_insn (insn, cost);
              continue;
            }

          if (! (*current_sched_info->can_schedule_ready_p) (insn))
            goto next;

          last_scheduled_insn = move_insn (insn, last_scheduled_insn);

          /* INSN is being issued, so commit the trial automaton
             state.  */
          if (targetm.sched.use_dfa_pipeline_interface
              && (*targetm.sched.use_dfa_pipeline_interface) ())
            memcpy (curr_state, temp_state, dfa_state_size);

          if (targetm.sched.variable_issue)
            can_issue_more =
              (*targetm.sched.variable_issue) (sched_dump, sched_verbose,
                                               insn, can_issue_more);
          else
            can_issue_more--;

          schedule_insn (insn, &ready, clock_var);

          /* Also reached directly when can_schedule_ready_p rejected
             INSN.  */
        next:
          first_cycle_insn_p = 0;

          if (targetm.sched.reorder2)
            {
              /* Sort the ready list based on priority.  */
              if (ready.n_ready > 0)
                ready_sort (&ready);
              can_issue_more =
                (*targetm.sched.reorder2) (sched_dump,sched_verbose,
                                           ready.n_ready
                                           ? ready_lastpos (&ready) : NULL,
                                           &ready.n_ready, clock_var);
            }
        }

      if ((!targetm.sched.use_dfa_pipeline_interface
           || !(*targetm.sched.use_dfa_pipeline_interface) ())
          && sched_verbose)
        /* Debug info.  */
        visualize_scheduled_insns (clock_var);
    }

  if (targetm.sched.md_finish)
    (*targetm.sched.md_finish) (sched_dump, sched_verbose);

  /* Debug info.  */
  if (sched_verbose)
    {
      fprintf (sched_dump, ";;\tReady list (final):  ");
      debug_ready_list (&ready);
      if (!targetm.sched.use_dfa_pipeline_interface
          || !(*targetm.sched.use_dfa_pipeline_interface) ())
        print_block_visualization ("");
    }

  /* Sanity check -- queue must be empty now.  Meaningless if region has
     multiple bbs.  */
  if (current_sched_info->queue_must_finish_empty && q_size != 0)
      abort ();

  /* Update head/tail boundaries.  */
  head = NEXT_INSN (prev_head);
  tail = last_scheduled_insn;

  /* Restore-other-notes: NOTE_LIST is the end of a chain of notes
     previously found among the insns.  Insert them at the beginning
     of the insns.  */
  if (note_list != 0)
    {
      rtx note_head = note_list;

      /* Walk back to the first note of the chain.  */
      while (PREV_INSN (note_head))
        {
          note_head = PREV_INSN (note_head);
        }

      /* Splice the whole chain in just before HEAD; the first note
         becomes the new HEAD.  */
      PREV_INSN (note_head) = PREV_INSN (head);
      NEXT_INSN (PREV_INSN (head)) = note_head;
      PREV_INSN (head) = note_list;
      NEXT_INSN (note_list) = head;
      head = note_head;
    }

  /* Debugging.  */
  if (sched_verbose)
    {
      fprintf (sched_dump, ";;   total time = %d\n;;   new head = %d\n",
               clock_var, INSN_UID (head));
      fprintf (sched_dump, ";;   new tail = %d\n\n",
               INSN_UID (tail));
      visualize_free ();
    }

  /* Report the new block boundaries through CURRENT_SCHED_INFO.  */
  current_sched_info->head = head;
  current_sched_info->tail = tail;

  free (ready.vec);

  /* READY_TRY was only allocated when the DFA interface is in use.  */
  if (targetm.sched.use_dfa_pipeline_interface
      && (*targetm.sched.use_dfa_pipeline_interface) ())
    free (ready_try);
}
2277 \f
2278 /* Set_priorities: compute priority of each insn in the block.  */
2279
2280 int
2281 set_priorities (head, tail)
2282      rtx head, tail;
2283 {
2284   rtx insn;
2285   int n_insn;
2286
2287   rtx prev_head;
2288
2289   prev_head = PREV_INSN (head);
2290
2291   if (head == tail && (! INSN_P (head)))
2292     return 0;
2293
2294   n_insn = 0;
2295   for (insn = tail; insn != prev_head; insn = PREV_INSN (insn))
2296     {
2297       if (GET_CODE (insn) == NOTE)
2298         continue;
2299
2300       if (!(SCHED_GROUP_P (insn)))
2301         n_insn++;
2302       (void) priority (insn);
2303     }
2304
2305   return n_insn;
2306 }
2307
2308 /* Initialize some global state for the scheduler.  DUMP_FILE is to be used
2309    for debugging output.  */
2310
2311 void
2312 sched_init (dump_file)
2313      FILE *dump_file;
2314 {
2315   int luid, b;
2316   rtx insn;
2317   int i;
2318
2319   /* Disable speculative loads in their presence if cc0 defined.  */
2320 #ifdef HAVE_cc0
2321   flag_schedule_speculative_load = 0;
2322 #endif
2323
2324   /* Set dump and sched_verbose for the desired debugging output.  If no
2325      dump-file was specified, but -fsched-verbose=N (any N), print to stderr.
2326      For -fsched-verbose=N, N>=10, print everything to stderr.  */
2327   sched_verbose = sched_verbose_param;
2328   if (sched_verbose_param == 0 && dump_file)
2329     sched_verbose = 1;
2330   sched_dump = ((sched_verbose_param >= 10 || !dump_file)
2331                 ? stderr : dump_file);
2332
2333   /* Initialize issue_rate.  */
2334   if (targetm.sched.issue_rate)
2335     issue_rate = (*targetm.sched.issue_rate) ();
2336   else
2337     issue_rate = 1;
2338
2339   /* We use LUID 0 for the fake insn (UID 0) which holds dependencies for
2340      pseudos which do not cross calls.  */
2341   old_max_uid = get_max_uid () + 1;
2342
2343   h_i_d = (struct haifa_insn_data *) xcalloc (old_max_uid, sizeof (*h_i_d));
2344
2345   for (i = 0; i < old_max_uid; i++)
2346     h_i_d [i].cost = -1;
2347
2348   if (targetm.sched.use_dfa_pipeline_interface
2349       && (*targetm.sched.use_dfa_pipeline_interface) ())
2350     {
2351       if (targetm.sched.init_dfa_pre_cycle_insn)
2352         (*targetm.sched.init_dfa_pre_cycle_insn) ();
2353
2354       if (targetm.sched.init_dfa_post_cycle_insn)
2355         (*targetm.sched.init_dfa_post_cycle_insn) ();
2356
2357       if (targetm.sched.first_cycle_multipass_dfa_lookahead
2358           && targetm.sched.init_dfa_bubbles)
2359         (*targetm.sched.init_dfa_bubbles) ();
2360
2361       dfa_start ();
2362       dfa_state_size = state_size ();
2363       curr_state = xmalloc (dfa_state_size);
2364     }
2365
2366   h_i_d[0].luid = 0;
2367   luid = 1;
2368   for (b = 0; b < n_basic_blocks; b++)
2369     for (insn = BLOCK_HEAD (b);; insn = NEXT_INSN (insn))
2370       {
2371         INSN_LUID (insn) = luid;
2372
2373         /* Increment the next luid, unless this is a note.  We don't
2374            really need separate IDs for notes and we don't want to
2375            schedule differently depending on whether or not there are
2376            line-number notes, i.e., depending on whether or not we're
2377            generating debugging information.  */
2378         if (GET_CODE (insn) != NOTE)
2379           ++luid;
2380
2381         if (insn == BLOCK_END (b))
2382           break;
2383       }
2384
2385   init_dependency_caches (luid);
2386
2387   compute_bb_for_insn (old_max_uid);
2388
2389   init_alias_analysis ();
2390
2391   if (write_symbols != NO_DEBUG)
2392     {
2393       rtx line;
2394
2395       line_note_head = (rtx *) xcalloc (n_basic_blocks, sizeof (rtx));
2396
2397       /* Save-line-note-head:
2398          Determine the line-number at the start of each basic block.
2399          This must be computed and saved now, because after a basic block's
2400          predecessor has been scheduled, it is impossible to accurately
2401          determine the correct line number for the first insn of the block.  */
2402
2403       for (b = 0; b < n_basic_blocks; b++)
2404         {
2405           for (line = BLOCK_HEAD (b); line; line = PREV_INSN (line))
2406             if (GET_CODE (line) == NOTE && NOTE_LINE_NUMBER (line) > 0)
2407               {
2408                 line_note_head[b] = line;
2409                 break;
2410               }
2411           /* Do a forward search as well, since we won't get to see the first
2412              notes in a basic block.  */
2413           for (line = BLOCK_HEAD (b); line; line = NEXT_INSN (line))
2414             {
2415               if (INSN_P (line))
2416                 break;
2417               if (GET_CODE (line) == NOTE && NOTE_LINE_NUMBER (line) > 0)
2418                 line_note_head[b] = line;
2419             }
2420         }
2421     }
2422
2423   if ((!targetm.sched.use_dfa_pipeline_interface
2424        || !(*targetm.sched.use_dfa_pipeline_interface) ())
2425       && sched_verbose)
2426     /* Find units used in this function, for visualization.  */
2427     init_target_units ();
2428
2429   /* ??? Add a NOTE after the last insn of the last basic block.  It is not
2430      known why this is done.  */
2431
2432   insn = BLOCK_END (n_basic_blocks - 1);
2433   if (NEXT_INSN (insn) == 0
2434       || (GET_CODE (insn) != NOTE
2435           && GET_CODE (insn) != CODE_LABEL
2436           /* Don't emit a NOTE if it would end up before a BARRIER.  */
2437           && GET_CODE (NEXT_INSN (insn)) != BARRIER))
2438     {
2439       emit_note_after (NOTE_INSN_DELETED, BLOCK_END (n_basic_blocks - 1));
2440       /* Make insn to appear outside BB.  */
2441       BLOCK_END (n_basic_blocks - 1) = PREV_INSN (BLOCK_END (n_basic_blocks - 1));
2442     }
2443
2444   /* Compute INSN_REG_WEIGHT for all blocks.  We must do this before
2445      removing death notes.  */
2446   for (b = n_basic_blocks - 1; b >= 0; b--)
2447     find_insn_reg_weight (b);
2448 }
2449
2450 /* Free global data used during insn scheduling.  */
2451
2452 void
2453 sched_finish ()
2454 {
2455   free (h_i_d);
2456
2457   if (targetm.sched.use_dfa_pipeline_interface
2458       && (*targetm.sched.use_dfa_pipeline_interface) ())
2459     {
2460       free (curr_state);
2461       dfa_finish ();
2462     }
2463   free_dependency_caches ();
2464   end_alias_analysis ();
2465   if (write_symbols != NO_DEBUG)
2466     free (line_note_head);
2467 }
2468 #endif /* INSN_SCHEDULING */