gcc/loop.c

   1 /* Perform various loop optimizations, including strength reduction.
   2    Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995,
   3    1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005
   4    Free Software Foundation, Inc.
   5
   6 This file is part of GCC.
   7
   8 GCC is free software; you can redistribute it and/or modify it under
   9 the terms of the GNU General Public License as published by the Free
  10 Software Foundation; either version 2, or (at your option) any later
  11 version.
  12
  13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  16 for more details.
  17
  18 You should have received a copy of the GNU General Public License
  19 along with GCC; see the file COPYING.  If not, write to the Free
  20 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  21 02111-1307, USA.  */
  22
  23 /* This is the loop optimization pass of the compiler.
  24    It finds invariant computations within loops and moves them
  25    to the beginning of the loop.  Then it identifies basic and
  26    general induction variables.
  27
  28    Basic induction variables (BIVs) are a pseudo registers which are set within
  29    a loop only by incrementing or decrementing its value.  General induction
  30    variables (GIVs) are pseudo registers with a value which is a linear function
  31    of a basic induction variable.  BIVs are recognized by `basic_induction_var';
  32    GIVs by `general_induction_var'.
  33
  34    Once induction variables are identified, strength reduction is applied to the
  35    general induction variables, and induction variable elimination is applied to
  36    the basic induction variables.
  37
  38    It also finds cases where
  39    a register is set within the loop by zero-extending a narrower value
  40    and changes these to zero the entire register once before the loop
  41    and merely copy the low part within the loop.
  42
  43    Most of the complexity is in heuristics to decide when it is worth
  44    while to do these things.  */
  45
  46 #include "config.h"
  47 #include "system.h"
  48 #include "coretypes.h"
  49 #include "tm.h"
  50 #include "rtl.h"
  51 #include "tm_p.h"
  52 #include "function.h"
  53 #include "expr.h"
  54 #include "hard-reg-set.h"
  55 #include "basic-block.h"
  56 #include "insn-config.h"
  57 #include "regs.h"
  58 #include "recog.h"
  59 #include "flags.h"
  60 #include "real.h"
  61 #include "cselib.h"
  62 #include "except.h"
  63 #include "toplev.h"
  64 #include "predict.h"
  65 #include "insn-flags.h"
  66 #include "optabs.h"
  67 #include "cfgloop.h"
  68 #include "ggc.h"
  69
  70 /* Get the loop info pointer of a loop.  */
  71 #define LOOP_INFO(LOOP) ((struct loop_info *) (LOOP)->aux)
  72
  73 /* Get a pointer to the loop movables structure.  */
  74 #define LOOP_MOVABLES(LOOP) (&LOOP_INFO (LOOP)->movables)
  75
  76 /* Get a pointer to the loop registers structure.  */
  77 #define LOOP_REGS(LOOP) (&LOOP_INFO (LOOP)->regs)
  78
  79 /* Get a pointer to the loop induction variables structure.  */
  80 #define LOOP_IVS(LOOP) (&LOOP_INFO (LOOP)->ivs)
  81
  82 /* Get the luid of an insn.  Catch the error of trying to reference the LUID
  83    of an insn added during loop, since these don't have LUIDs.  */
  84
  85 #define INSN_LUID(INSN)                 \
  86   (gcc_assert (INSN_UID (INSN) < max_uid_for_loop), uid_luid[INSN_UID (INSN)])
  87
  88 #define REGNO_FIRST_LUID(REGNO)                 \
  89   (REGNO_FIRST_UID (REGNO) < max_uid_for_loop   \
  90         ? uid_luid[REGNO_FIRST_UID (REGNO)]     \
  91         : 0)
  92 #define REGNO_LAST_LUID(REGNO)                  \
  93   (REGNO_LAST_UID (REGNO) < max_uid_for_loop    \
  94         ? uid_luid[REGNO_LAST_UID (REGNO)]      \
  95         : INT_MAX)
  96
  97 /* A "basic induction variable" or biv is a pseudo reg that is set
  98    (within this loop) only by incrementing or decrementing it.  */
  99 /* A "general induction variable" or giv is a pseudo reg whose
 100    value is a linear function of a biv.  */
 101
 102 /* Bivs are recognized by `basic_induction_var';
 103    Givs by `general_induction_var'.  */
 104
 105 /* An enum for the two different types of givs, those that are used
 106    as memory addresses and those that are calculated into registers.  */
 107 enum g_types
 108 {
 109   DEST_ADDR,
 110   DEST_REG
 111 };
 112
 113
 114 /* A `struct induction' is created for every instruction that sets
 115    an induction variable (either a biv or a giv).  */
 116
 117 struct induction
 118 {
 119   rtx insn;                     /* The insn that sets a biv or giv */
 120   rtx new_reg;                  /* New register, containing strength reduced
 121                                    version of this giv.  */
 122   rtx src_reg;                  /* Biv from which this giv is computed.
 123                                    (If this is a biv, then this is the biv.) */
 124   enum g_types giv_type;        /* Indicate whether DEST_ADDR or DEST_REG */
 125   rtx dest_reg;                 /* Destination register for insn: this is the
 126                                    register which was the biv or giv.
 127                                    For a biv, this equals src_reg.
 128                                    For a DEST_ADDR type giv, this is 0.  */
 129   rtx *location;                /* Place in the insn where this giv occurs.
 130                                    If GIV_TYPE is DEST_REG, this is 0.  */
 131                                 /* For a biv, this is the place where add_val
 132                                    was found.  */
 133   enum machine_mode mode;       /* The mode of this biv or giv */
 134   rtx mem;                      /* For DEST_ADDR, the memory object.  */
 135   rtx mult_val;                 /* Multiplicative factor for src_reg.  */
 136   rtx add_val;                  /* Additive constant for that product.  */
 137   int benefit;                  /* Gain from eliminating this insn.  */
 138   rtx final_value;              /* If the giv is used outside the loop, and its
 139                                    final value could be calculated, it is put
 140                                    here, and the giv is made replaceable.  Set
 141                                    the giv to this value before the loop.  */
 142   unsigned combined_with;       /* The number of givs this giv has been
 143                                    combined with.  If nonzero, this giv
 144                                    cannot combine with any other giv.  */
 145   unsigned replaceable : 1;     /* 1 if we can substitute the strength-reduced
 146                                    variable for the original variable.
 147                                    0 means they must be kept separate and the
 148                                    new one must be copied into the old pseudo
 149                                    reg each time the old one is set.  */
 150   unsigned not_replaceable : 1; /* Used to prevent duplicating work.  This is
 151                                    1 if we know that the giv definitely can
 152                                    not be made replaceable, in which case we
 153                                    don't bother checking the variable again
 154                                    even if further info is available.
 155                                    Both this and the above can be zero.  */
 156   unsigned ignore : 1;          /* 1 prohibits further processing of giv */
 157   unsigned always_computable : 1;/* 1 if this value is computable every
 158                                     iteration.  */
 159   unsigned always_executed : 1; /* 1 if this set occurs each iteration.  */
 160   unsigned maybe_multiple : 1;  /* Only used for a biv and  1 if this biv
 161                                    update may be done multiple times per
 162                                    iteration.  */
 163   unsigned cant_derive : 1;     /* For giv's, 1 if this giv cannot derive
 164                                    another giv.  This occurs in many cases
 165                                    where a giv's lifetime spans an update to
 166                                    a biv.  */
 167   unsigned maybe_dead : 1;      /* 1 if this giv might be dead.  In that case,
 168                                    we won't use it to eliminate a biv, it
 169                                    would probably lose.  */
 170   unsigned auto_inc_opt : 1;    /* 1 if this giv had its increment output next
 171                                    to it to try to form an auto-inc address.  */
 172   unsigned shared : 1;
 173   unsigned no_const_addval : 1; /* 1 if add_val does not contain a const.  */
 174   int lifetime;                 /* Length of life of this giv */
 175   rtx derive_adjustment;        /* If nonzero, is an adjustment to be
 176                                    subtracted from add_val when this giv
 177                                    derives another.  This occurs when the
 178                                    giv spans a biv update by incrementation.  */
 179   rtx ext_dependent;            /* If nonzero, is a sign or zero extension
 180                                    if a biv on which this giv is dependent.  */
 181   struct induction *next_iv;    /* For givs, links together all givs that are
 182                                    based on the same biv.  For bivs, links
 183                                    together all biv entries that refer to the
 184                                    same biv register.  */
 185   struct induction *same;       /* For givs, if the giv has been combined with
 186                                    another giv, this points to the base giv.
 187                                    The base giv will have COMBINED_WITH nonzero.
 188                                    For bivs, if the biv has the same LOCATION
 189                                    than another biv, this points to the base
 190                                    biv.  */
 191   struct induction *same_insn;  /* If there are multiple identical givs in
 192                                    the same insn, then all but one have this
 193                                    field set, and they all point to the giv
 194                                    that doesn't have this field set.  */
 195   rtx last_use;                 /* For a giv made from a biv increment, this is
 196                                    a substitute for the lifetime information.  */
 197 };
 198
 199
 200 /* A `struct iv_class' is created for each biv.  */
 201
 202 struct iv_class
 203 {
 204   unsigned int regno;           /* Pseudo reg which is the biv.  */
 205   int biv_count;                /* Number of insns setting this reg.  */
 206   struct induction *biv;        /* List of all insns that set this reg.  */
 207   int giv_count;                /* Number of DEST_REG givs computed from this
 208                                    biv.  The resulting count is only used in
 209                                    check_dbra_loop.  */
 210   struct induction *giv;        /* List of all insns that compute a giv
 211                                    from this reg.  */
 212   int total_benefit;            /* Sum of BENEFITs of all those givs.  */
 213   rtx initial_value;            /* Value of reg at loop start.  */
 214   rtx initial_test;             /* Test performed on BIV before loop.  */
 215   rtx final_value;              /* Value of reg at loop end, if known.  */
 216   struct iv_class *next;        /* Links all class structures together.  */
 217   rtx init_insn;                /* insn which initializes biv, 0 if none.  */
 218   rtx init_set;                 /* SET of INIT_INSN, if any.  */
 219   unsigned incremented : 1;     /* 1 if somewhere incremented/decremented */
 220   unsigned eliminable : 1;      /* 1 if plausible candidate for
 221                                    elimination.  */
 222   unsigned nonneg : 1;          /* 1 if we added a REG_NONNEG note for
 223                                    this.  */
 224   unsigned reversed : 1;        /* 1 if we reversed the loop that this
 225                                    biv controls.  */
 226   unsigned all_reduced : 1;     /* 1 if all givs using this biv have
 227                                    been reduced.  */
 228 };
 229
 230
 231 /* Definitions used by the basic induction variable discovery code.  */
 232 enum iv_mode
 233 {
 234   UNKNOWN_INDUCT,
 235   BASIC_INDUCT,
 236   NOT_BASIC_INDUCT,
 237   GENERAL_INDUCT
 238 };
 239
 240
 241 /* A `struct iv' is created for every register.  */
 242
 243 struct iv
 244 {
 245   enum iv_mode type;
 246   union
 247   {
 248     struct iv_class *class;
 249     struct induction *info;
 250   } iv;
 251 };
 252
 253
 254 #define REG_IV_TYPE(ivs, n) ivs->regs[n].type
 255 #define REG_IV_INFO(ivs, n) ivs->regs[n].iv.info
 256 #define REG_IV_CLASS(ivs, n) ivs->regs[n].iv.class
 257
 258
 259 struct loop_ivs
 260 {
 261   /* Indexed by register number, contains pointer to `struct
 262      iv' if register is an induction variable.  */
 263   struct iv *regs;
 264
 265   /* Size of regs array.  */
 266   unsigned int n_regs;
 267
 268   /* The head of a list which links together (via the next field)
 269      every iv class for the current loop.  */
 270   struct iv_class *list;
 271 };
 272
 273
 274 typedef struct loop_mem_info
 275 {
 276   rtx mem;      /* The MEM itself.  */
 277   rtx reg;      /* Corresponding pseudo, if any.  */
 278   int optimize; /* Nonzero if we can optimize access to this MEM.  */
 279 } loop_mem_info;
 280
 281
 282
 283 struct loop_reg
 284 {
 285   /* Number of times the reg is set during the loop being scanned.
 286      During code motion, a negative value indicates a reg that has
 287      been made a candidate; in particular -2 means that it is an
 288      candidate that we know is equal to a constant and -1 means that
 289      it is a candidate not known equal to a constant.  After code
 290      motion, regs moved have 0 (which is accurate now) while the
 291      failed candidates have the original number of times set.
 292
 293      Therefore, at all times, == 0 indicates an invariant register;
 294      < 0 a conditionally invariant one.  */
 295   int set_in_loop;
 296
 297   /* Original value of set_in_loop; same except that this value
 298      is not set negative for a reg whose sets have been made candidates
 299      and not set to 0 for a reg that is moved.  */
 300   int n_times_set;
 301
 302   /* Contains the insn in which a register was used if it was used
 303      exactly once; contains const0_rtx if it was used more than once.  */
 304   rtx single_usage;
 305
 306   /* Nonzero indicates that the register cannot be moved or strength
 307      reduced.  */
 308   char may_not_optimize;
 309
 310   /* Nonzero means reg N has already been moved out of one loop.
 311      This reduces the desire to move it out of another.  */
 312   char moved_once;
 313 };
 314
 315
 316 struct loop_regs
 317 {
 318   int num;                      /* Number of regs used in table.  */
 319   int size;                     /* Size of table.  */
 320   struct loop_reg *array;       /* Register usage info. array.  */
 321   int multiple_uses;            /* Nonzero if a reg has multiple uses.  */
 322 };
 323
 324
 325
 326 struct loop_movables
 327 {
 328   /* Head of movable chain.  */
 329   struct movable *head;
 330   /* Last movable in chain.  */
 331   struct movable *last;
 332 };
 333
 334
 335 /* Information pertaining to a loop.  */
 336
 337 struct loop_info
 338 {
 339   /* Nonzero if there is a subroutine call in the current loop.  */
 340   int has_call;
 341   /* Nonzero if there is a libcall in the current loop.  */
 342   int has_libcall;
 343   /* Nonzero if there is a non constant call in the current loop.  */
 344   int has_nonconst_call;
 345   /* Nonzero if there is a prefetch instruction in the current loop.  */
 346   int has_prefetch;
 347   /* Nonzero if there is a volatile memory reference in the current
 348      loop.  */
 349   int has_volatile;
 350   /* Nonzero if there is a tablejump in the current loop.  */
 351   int has_tablejump;
 352   /* Nonzero if there are ways to leave the loop other than falling
 353      off the end.  */
 354   int has_multiple_exit_targets;
 355   /* Nonzero if there is an indirect jump in the current function.  */
 356   int has_indirect_jump;
 357   /* Register or constant initial loop value.  */
 358   rtx initial_value;
 359   /* Register or constant value used for comparison test.  */
 360   rtx comparison_value;
 361   /* Register or constant approximate final value.  */
 362   rtx final_value;
 363   /* Register or constant initial loop value with term common to
 364      final_value removed.  */
 365   rtx initial_equiv_value;
 366   /* Register or constant final loop value with term common to
 367      initial_value removed.  */
 368   rtx final_equiv_value;
 369   /* Register corresponding to iteration variable.  */
 370   rtx iteration_var;
 371   /* Constant loop increment.  */
 372   rtx increment;
 373   enum rtx_code comparison_code;
 374   /* Holds the number of loop iterations.  It is zero if the number
 375      could not be calculated.  Must be unsigned since the number of
 376      iterations can be as high as 2^wordsize - 1.  For loops with a
 377      wider iterator, this number will be zero if the number of loop
 378      iterations is too large for an unsigned integer to hold.  */
 379   unsigned HOST_WIDE_INT n_iterations;
 380   int used_count_register;
 381   /* The loop iterator induction variable.  */
 382   struct iv_class *iv;
 383   /* List of MEMs that are stored in this loop.  */
 384   rtx store_mems;
 385   /* Array of MEMs that are used (read or written) in this loop, but
 386      cannot be aliased by anything in this loop, except perhaps
 387      themselves.  In other words, if mems[i] is altered during
 388      the loop, it is altered by an expression that is rtx_equal_p to
 389      it.  */
 390   loop_mem_info *mems;
 391   /* The index of the next available slot in MEMS.  */
 392   int mems_idx;
 393   /* The number of elements allocated in MEMS.  */
 394   int mems_allocated;
 395   /* Nonzero if we don't know what MEMs were changed in the current
 396      loop.  This happens if the loop contains a call (in which case
 397      `has_call' will also be set) or if we store into more than
 398      NUM_STORES MEMs.  */
 399   int unknown_address_altered;
 400   /* The above doesn't count any readonly memory locations that are
 401      stored.  This does.  */
 402   int unknown_constant_address_altered;
 403   /* Count of memory write instructions discovered in the loop.  */
 404   int num_mem_sets;
 405   /* The insn where the first of these was found.  */
 406   rtx first_loop_store_insn;
 407   /* The chain of movable insns in loop.  */
 408   struct loop_movables movables;
 409   /* The registers used the in loop.  */
 410   struct loop_regs regs;
 411   /* The induction variable information in loop.  */
 412   struct loop_ivs ivs;
 413   /* Nonzero if call is in pre_header extended basic block.  */
 414   int pre_header_has_call;
 415 };
 416
 417 /* Not really meaningful values, but at least something.  */
 418 #ifndef SIMULTANEOUS_PREFETCHES
 419 #define SIMULTANEOUS_PREFETCHES 3
 420 #endif
 421 #ifndef PREFETCH_BLOCK
 422 #define PREFETCH_BLOCK 32
 423 #endif
 424 #ifndef HAVE_prefetch
 425 #define HAVE_prefetch 0
 426 #define CODE_FOR_prefetch 0
 427 #define gen_prefetch(a,b,c) (gcc_unreachable (), NULL_RTX)
 428 #endif
 429
 430 /* Give up the prefetch optimizations once we exceed a given threshold.
 431    It is unlikely that we would be able to optimize something in a loop
 432    with so many detected prefetches.  */
 433 #define MAX_PREFETCHES 100
 434 /* The number of prefetch blocks that are beneficial to fetch at once before
 435    a loop with a known (and low) iteration count.  */
 436 #define PREFETCH_BLOCKS_BEFORE_LOOP_MAX  6
 437 /* For very tiny loops it is not worthwhile to prefetch even before the loop,
 438    since it is likely that the data are already in the cache.  */
 439 #define PREFETCH_BLOCKS_BEFORE_LOOP_MIN  2
 440
 441 /* Parameterize some prefetch heuristics so they can be turned on and off
 442    easily for performance testing on new architectures.  These can be
 443    defined in target-dependent files.  */
 444
 445 /* Prefetch is worthwhile only when loads/stores are dense.  */
 446 #ifndef PREFETCH_ONLY_DENSE_MEM
 447 #define PREFETCH_ONLY_DENSE_MEM 1
 448 #endif
 449
 450 /* Define what we mean by "dense" loads and stores; This value divided by 256
 451    is the minimum percentage of memory references that worth prefetching.  */
 452 #ifndef PREFETCH_DENSE_MEM
 453 #define PREFETCH_DENSE_MEM 220
 454 #endif
 455
 456 /* Do not prefetch for a loop whose iteration count is known to be low.  */
 457 #ifndef PREFETCH_NO_LOW_LOOPCNT
 458 #define PREFETCH_NO_LOW_LOOPCNT 1
 459 #endif
 460
 461 /* Define what we mean by a "low" iteration count.  */
 462 #ifndef PREFETCH_LOW_LOOPCNT
 463 #define PREFETCH_LOW_LOOPCNT 32
 464 #endif
 465
 466 /* Do not prefetch for a loop that contains a function call; such a loop is
 467    probably not an internal loop.  */
 468 #ifndef PREFETCH_NO_CALL
 469 #define PREFETCH_NO_CALL 1
 470 #endif
 471
 472 /* Do not prefetch accesses with an extreme stride.  */
 473 #ifndef PREFETCH_NO_EXTREME_STRIDE
 474 #define PREFETCH_NO_EXTREME_STRIDE 1
 475 #endif
 476
 477 /* Define what we mean by an "extreme" stride.  */
 478 #ifndef PREFETCH_EXTREME_STRIDE
 479 #define PREFETCH_EXTREME_STRIDE 4096
 480 #endif
 481
 482 /* Define a limit to how far apart indices can be and still be merged
 483    into a single prefetch.  */
 484 #ifndef PREFETCH_EXTREME_DIFFERENCE
 485 #define PREFETCH_EXTREME_DIFFERENCE 4096
 486 #endif
 487
 488 /* Issue prefetch instructions before the loop to fetch data to be used
 489    in the first few loop iterations.  */
 490 #ifndef PREFETCH_BEFORE_LOOP
 491 #define PREFETCH_BEFORE_LOOP 1
 492 #endif
 493
 494 /* Do not handle reversed order prefetches (negative stride).  */
 495 #ifndef PREFETCH_NO_REVERSE_ORDER
 496 #define PREFETCH_NO_REVERSE_ORDER 1
 497 #endif
 498
 499 /* Prefetch even if the GIV is in conditional code.  */
 500 #ifndef PREFETCH_CONDITIONAL
 501 #define PREFETCH_CONDITIONAL 1
 502 #endif
 503
 504 #define LOOP_REG_LIFETIME(LOOP, REGNO) \
 505 ((REGNO_LAST_LUID (REGNO) - REGNO_FIRST_LUID (REGNO)))
 506
 507 #define LOOP_REG_GLOBAL_P(LOOP, REGNO) \
 508 ((REGNO_LAST_LUID (REGNO) > INSN_LUID ((LOOP)->end) \
 509  || REGNO_FIRST_LUID (REGNO) < INSN_LUID ((LOOP)->start)))
 510
 511 #define LOOP_REGNO_NREGS(REGNO, SET_DEST) \
 512 ((REGNO) < FIRST_PSEUDO_REGISTER \
 513  ? (int) hard_regno_nregs[(REGNO)][GET_MODE (SET_DEST)] : 1)
 514
 515
 516 /* Vector mapping INSN_UIDs to luids.
 517    The luids are like uids but increase monotonically always.
 518    We use them to see whether a jump comes from outside a given loop.  */
 519
 520 static int *uid_luid;
 521
 522 /* Indexed by INSN_UID, contains the ordinal giving the (innermost) loop
 523    number the insn is contained in.  */
 524
 525 static struct loop **uid_loop;
 526
 527 /* 1 + largest uid of any insn.  */
 528
 529 static int max_uid_for_loop;
 530
 531 /* Number of loops detected in current function.  Used as index to the
 532    next few tables.  */
 533
 534 static int max_loop_num;
 535
 536 /* Bound on pseudo register number before loop optimization.
 537    A pseudo has valid regscan info if its number is < max_reg_before_loop.  */
 538 static unsigned int max_reg_before_loop;
 539
 540 /* The value to pass to the next call of reg_scan_update.  */
 541 static int loop_max_reg;
 542 \f
 543 /* During the analysis of a loop, a chain of `struct movable's
 544    is made to record all the movable insns found.
 545    Then the entire chain can be scanned to decide which to move.  */
 546
 547 struct movable
 548 {
 549   rtx insn;                     /* A movable insn */
 550   rtx set_src;                  /* The expression this reg is set from.  */
 551   rtx set_dest;                 /* The destination of this SET.  */
 552   rtx dependencies;             /* When INSN is libcall, this is an EXPR_LIST
 553                                    of any registers used within the LIBCALL.  */
 554   int consec;                   /* Number of consecutive following insns
 555                                    that must be moved with this one.  */
 556   unsigned int regno;           /* The register it sets */
 557   short lifetime;               /* lifetime of that register;
 558                                    may be adjusted when matching movables
 559                                    that load the same value are found.  */
 560   short savings;                /* Number of insns we can move for this reg,
 561                                    including other movables that force this
 562                                    or match this one.  */
 563   ENUM_BITFIELD(machine_mode) savemode : 8;   /* Nonzero means it is a mode for
 564                                    a low part that we should avoid changing when
 565                                    clearing the rest of the reg.  */
 566   unsigned int cond : 1;        /* 1 if only conditionally movable */
 567   unsigned int force : 1;       /* 1 means MUST move this insn */
 568   unsigned int global : 1;      /* 1 means reg is live outside this loop */
 569                 /* If PARTIAL is 1, GLOBAL means something different:
 570                    that the reg is live outside the range from where it is set
 571                    to the following label.  */
 572   unsigned int done : 1;        /* 1 inhibits further processing of this */
 573
 574   unsigned int partial : 1;     /* 1 means this reg is used for zero-extending.
 575                                    In particular, moving it does not make it
 576                                    invariant.  */
 577   unsigned int move_insn : 1;   /* 1 means that we call emit_move_insn to
 578                                    load SRC, rather than copying INSN.  */
 579   unsigned int move_insn_first:1;/* Same as above, if this is necessary for the
 580                                     first insn of a consecutive sets group.  */
 581   unsigned int is_equiv : 1;    /* 1 means a REG_EQUIV is present on INSN.  */
 582   unsigned int insert_temp : 1;  /* 1 means we copy to a new pseudo and replace
 583                                     the original insn with a copy from that
 584                                     pseudo, rather than deleting it.  */
 585   struct movable *match;        /* First entry for same value */
 586   struct movable *forces;       /* An insn that must be moved if this is */
 587   struct movable *next;
 588 };
 589
 590
 591 static FILE *loop_dump_stream;
 592
 593 /* Forward declarations.  */
 594
 595 static void invalidate_loops_containing_label (rtx);
 596 static void find_and_verify_loops (rtx, struct loops *);
 597 static void mark_loop_jump (rtx, struct loop *);
 598 static void prescan_loop (struct loop *);
 599 static int reg_in_basic_block_p (rtx, rtx);
 600 static int consec_sets_invariant_p (const struct loop *, rtx, int, rtx);
 601 static int labels_in_range_p (rtx, int);
 602 static void count_one_set (struct loop_regs *, rtx, rtx, rtx *);
 603 static void note_addr_stored (rtx, rtx, void *);
 604 static void note_set_pseudo_multiple_uses (rtx, rtx, void *);
 605 static int loop_reg_used_before_p (const struct loop *, rtx, rtx);
 606 static rtx find_regs_nested (rtx, rtx);
 607 static void scan_loop (struct loop*, int);
 608 #if 0
 609 static void replace_call_address (rtx, rtx, rtx);
 610 #endif
 611 static rtx skip_consec_insns (rtx, int);
 612 static int libcall_benefit (rtx);
 613 static rtx libcall_other_reg (rtx, rtx);
 614 static void record_excess_regs (rtx, rtx, rtx *);
 615 static void ignore_some_movables (struct loop_movables *);
 616 static void force_movables (struct loop_movables *);
 617 static void combine_movables (struct loop_movables *, struct loop_regs *);
 618 static int num_unmoved_movables (const struct loop *);
 619 static int regs_match_p (rtx, rtx, struct loop_movables *);
 620 static int rtx_equal_for_loop_p (rtx, rtx, struct loop_movables *,
 621                                  struct loop_regs *);
 622 static void add_label_notes (rtx, rtx);
 623 static void move_movables (struct loop *loop, struct loop_movables *, int,
 624                            int);
 625 static void loop_movables_add (struct loop_movables *, struct movable *);
 626 static void loop_movables_free (struct loop_movables *);
 627 static int count_nonfixed_reads (const struct loop *, rtx);
 628 static void loop_bivs_find (struct loop *);
 629 static void loop_bivs_init_find (struct loop *);
 630 static void loop_bivs_check (struct loop *);
 631 static void loop_givs_find (struct loop *);
 632 static void loop_givs_check (struct loop *);
 633 static int loop_biv_eliminable_p (struct loop *, struct iv_class *, int, int);
 634 static int loop_giv_reduce_benefit (struct loop *, struct iv_class *,
 635                                     struct induction *, rtx);
 636 static void loop_givs_dead_check (struct loop *, struct iv_class *);
 637 static void loop_givs_reduce (struct loop *, struct iv_class *);
 638 static void loop_givs_rescan (struct loop *, struct iv_class *, rtx *);
 639 static void loop_ivs_free (struct loop *);
 640 static void strength_reduce (struct loop *, int);
 641 static void find_single_use_in_loop (struct loop_regs *, rtx, rtx);
 642 static int valid_initial_value_p (rtx, rtx, int, rtx);
 643 static void find_mem_givs (const struct loop *, rtx, rtx, int, int);
 644 static void record_biv (struct loop *, struct induction *, rtx, rtx, rtx,
 645                         rtx, rtx *, int, int);
 646 static void check_final_value (const struct loop *, struct induction *);
 647 static void loop_ivs_dump (const struct loop *, FILE *, int);
 648 static void loop_iv_class_dump (const struct iv_class *, FILE *, int);
 649 static void loop_biv_dump (const struct induction *, FILE *, int);
 650 static void loop_giv_dump (const struct induction *, FILE *, int);
 651 static void record_giv (const struct loop *, struct induction *, rtx, rtx,
 652                         rtx, rtx, rtx, rtx, int, enum g_types, int, int,
 653                         rtx *);
 654 static void update_giv_derive (const struct loop *, rtx);
 655 static HOST_WIDE_INT get_monotonic_increment (struct iv_class *);
 656 static bool biased_biv_fits_mode_p (const struct loop *, struct iv_class *,
 657                                     HOST_WIDE_INT, enum machine_mode,
 658                                     unsigned HOST_WIDE_INT);
 659 static bool biv_fits_mode_p (const struct loop *, struct iv_class *,
 660                              HOST_WIDE_INT, enum machine_mode, bool);
 661 static bool extension_within_bounds_p (const struct loop *, struct iv_class *,
 662                                        HOST_WIDE_INT, rtx);
 663 static void check_ext_dependent_givs (const struct loop *, struct iv_class *);
 664 static int basic_induction_var (const struct loop *, rtx, enum machine_mode,
 665                                 rtx, rtx, rtx *, rtx *, rtx **);
 666 static rtx simplify_giv_expr (const struct loop *, rtx, rtx *, int *);
 667 static int general_induction_var (const struct loop *loop, rtx, rtx *, rtx *,
 668                                   rtx *, rtx *, int, int *, enum machine_mode);
 669 static int consec_sets_giv (const struct loop *, int, rtx, rtx, rtx, rtx *,
 670                             rtx *, rtx *, rtx *);
 671 static int check_dbra_loop (struct loop *, int);
 672 static rtx express_from_1 (rtx, rtx, rtx);
 673 static rtx combine_givs_p (struct induction *, struct induction *);
 674 static int cmp_combine_givs_stats (const void *, const void *);
 675 static void combine_givs (struct loop_regs *, struct iv_class *);
 676 static int product_cheap_p (rtx, rtx);
 677 static int maybe_eliminate_biv (const struct loop *, struct iv_class *, int,
 678                                 int, int);
 679 static int maybe_eliminate_biv_1 (const struct loop *, rtx, rtx,
 680                                   struct iv_class *, int, basic_block, rtx);
 681 static int last_use_this_basic_block (rtx, rtx);
 682 static void record_initial (rtx, rtx, void *);
 683 static void update_reg_last_use (rtx, rtx);
 684 static rtx next_insn_in_loop (const struct loop *, rtx);
 685 static void loop_regs_scan (const struct loop *, int);
 686 static int count_insns_in_loop (const struct loop *);
 687 static int find_mem_in_note_1 (rtx *, void *);
 688 static rtx find_mem_in_note (rtx);
 689 static void load_mems (const struct loop *);
 690 static int insert_loop_mem (rtx *, void *);
 691 static int replace_loop_mem (rtx *, void *);
 692 static void replace_loop_mems (rtx, rtx, rtx, int);
 693 static int replace_loop_reg (rtx *, void *);
 694 static void replace_loop_regs (rtx insn, rtx, rtx);
 695 static void note_reg_stored (rtx, rtx, void *);
 696 static void try_copy_prop (const struct loop *, rtx, unsigned int);
 697 static void try_swap_copy_prop (const struct loop *, rtx, unsigned int);
 698 static rtx check_insn_for_givs (struct loop *, rtx, int, int);
 699 static rtx check_insn_for_bivs (struct loop *, rtx, int, int);
 700 static rtx gen_add_mult (rtx, rtx, rtx, rtx);
 701 static void loop_regs_update (const struct loop *, rtx);
 702 static int iv_add_mult_cost (rtx, rtx, rtx, rtx);
 703 static int loop_invariant_p (const struct loop *, rtx);
 704 static rtx loop_insn_hoist (const struct loop *, rtx);
 705 static void loop_iv_add_mult_emit_before (const struct loop *, rtx, rtx, rtx,
 706                                           rtx, basic_block, rtx);
 707 static rtx loop_insn_emit_before (const struct loop *, basic_block,
 708                                   rtx, rtx);
 709 static int loop_insn_first_p (rtx, rtx);
 710 static rtx get_condition_for_loop (const struct loop *, rtx);
 711 static void loop_iv_add_mult_sink (const struct loop *, rtx, rtx, rtx, rtx);
 712 static void loop_iv_add_mult_hoist (const struct loop *, rtx, rtx, rtx, rtx);
 713 static rtx extend_value_for_giv (struct induction *, rtx);
 714 static rtx loop_insn_sink (const struct loop *, rtx);
 715
 716 static rtx loop_insn_emit_after (const struct loop *, basic_block, rtx, rtx);
 717 static rtx loop_call_insn_emit_before (const struct loop *, basic_block,
 718                                        rtx, rtx);
 719 static rtx loop_call_insn_hoist (const struct loop *, rtx);
 720 static rtx loop_insn_sink_or_swim (const struct loop *, rtx);
 721
 722 static void loop_dump_aux (const struct loop *, FILE *, int);
 723 static void loop_delete_insns (rtx, rtx);
 724 static HOST_WIDE_INT remove_constant_addition (rtx *);
 725 static rtx gen_load_of_final_value (rtx, rtx);
 726 void debug_ivs (const struct loop *);
 727 void debug_iv_class (const struct iv_class *);
 728 void debug_biv (const struct induction *);
 729 void debug_giv (const struct induction *);
 730 void debug_loop (const struct loop *);
 731 void debug_loops (const struct loops *);
 732
 733 typedef struct loop_replace_args
 734 {
 735   rtx match;
 736   rtx replacement;
 737   rtx insn;
 738 } loop_replace_args;
 739
 740 /* Nonzero iff INSN is between START and END, inclusive.  */
 741 #define INSN_IN_RANGE_P(INSN, START, END)       \
 742   (INSN_UID (INSN) < max_uid_for_loop           \
 743    && INSN_LUID (INSN) >= INSN_LUID (START)     \
 744    && INSN_LUID (INSN) <= INSN_LUID (END))
 745
 746 /* Indirect_jump_in_function is computed once per function.  */
 747 static int indirect_jump_in_function;
 748 static int indirect_jump_in_function_p (rtx);
 749
 750 static int compute_luids (rtx, rtx, int);
 751
 752 static int biv_elimination_giv_has_0_offset (struct induction *,
 753                                              struct induction *, rtx);
 754 \f
 755 /* Benefit penalty, if a giv is not replaceable, i.e. must emit an insn to
 756    copy the value of the strength reduced giv to its original register.  */
 757 static int copy_cost;
 758
 759 /* Cost of using a register, to normalize the benefits of a giv.  */
 760 static int reg_address_cost;
 761
 762 void
 763 init_loop (void)
 764 {
 765   rtx reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
 766
 767   reg_address_cost = address_cost (reg, SImode);
 768
 769   copy_cost = COSTS_N_INSNS (1);
 770 }
 771 \f
 772 /* Compute the mapping from uids to luids.
 773    LUIDs are numbers assigned to insns, like uids,
 774    except that luids increase monotonically through the code.
 775    Start at insn START and stop just before END.  Assign LUIDs
 776    starting with PREV_LUID + 1.  Return the last assigned LUID + 1.  */
 777 static int
 778 compute_luids (rtx start, rtx end, int prev_luid)
 779 {
 780   int i;
 781   rtx insn;
 782
 783   for (insn = start, i = prev_luid; insn != end; insn = NEXT_INSN (insn))
 784     {
 785       if (INSN_UID (insn) >= max_uid_for_loop)
 786         continue;
 787       /* Don't assign luids to line-number NOTEs, so that the distance in
 788          luids between two insns is not affected by -g.  */
 789       if (!NOTE_P (insn)
 790           || NOTE_LINE_NUMBER (insn) <= 0)
 791         uid_luid[INSN_UID (insn)] = ++i;
 792       else
 793         /* Give a line number note the same luid as preceding insn.  */
 794         uid_luid[INSN_UID (insn)] = i;
 795     }
 796   return i + 1;
 797 }
 798 \f
 799 /* Entry point of this file.  Perform loop optimization
 800    on the current function.  F is the first insn of the function
 801    and DUMPFILE is a stream for output of a trace of actions taken
 802    (or 0 if none should be output).  */
 803
 804 void
 805 loop_optimize (rtx f, FILE *dumpfile, int flags)
 806 {
 807   rtx insn;
 808   int i;
 809   struct loops loops_data;
 810   struct loops *loops = &loops_data;
 811   struct loop_info *loops_info;
 812
 813   loop_dump_stream = dumpfile;
 814
 815   init_recog_no_volatile ();
 816
 817   max_reg_before_loop = max_reg_num ();
 818   loop_max_reg = max_reg_before_loop;
 819
 820   regs_may_share = 0;
 821
 822   /* Count the number of loops.  */
 823
 824   max_loop_num = 0;
 825   for (insn = f; insn; insn = NEXT_INSN (insn))
 826     {
 827       if (NOTE_P (insn)
 828           && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
 829         max_loop_num++;
 830     }
 831
 832   /* Don't waste time if no loops.  */
 833   if (max_loop_num == 0)
 834     return;
 835
 836   loops->num = max_loop_num;
 837
 838   /* Get size to use for tables indexed by uids.
 839      Leave some space for labels allocated by find_and_verify_loops.  */
 840   max_uid_for_loop = get_max_uid () + 1 + max_loop_num * 32;
 841
 842   uid_luid = xcalloc (max_uid_for_loop, sizeof (int));
 843   uid_loop = xcalloc (max_uid_for_loop, sizeof (struct loop *));
 844
 845   /* Allocate storage for array of loops.  */
 846   loops->array = xcalloc (loops->num, sizeof (struct loop));
 847
 848   /* Find and process each loop.
 849      First, find them, and record them in order of their beginnings.  */
 850   find_and_verify_loops (f, loops);
 851
 852   /* Allocate and initialize auxiliary loop information.  */
 853   loops_info = xcalloc (loops->num, sizeof (struct loop_info));
 854   for (i = 0; i < (int) loops->num; i++)
 855     loops->array[i].aux = loops_info + i;
 856
 857   /* Now find all register lifetimes.  This must be done after
 858      find_and_verify_loops, because it might reorder the insns in the
 859      function.  */
 860   reg_scan (f, max_reg_before_loop);
 861
 862   /* This must occur after reg_scan so that registers created by gcse
 863      will have entries in the register tables.
 864
 865      We could have added a call to reg_scan after gcse_main in toplev.c,
 866      but moving this call to init_alias_analysis is more efficient.  */
 867   init_alias_analysis ();
 868
 869   /* See if we went too far.  Note that get_max_uid already returns
 870      one more that the maximum uid of all insn.  */
 871   gcc_assert (get_max_uid () <= max_uid_for_loop);
 872   /* Now reset it to the actual size we need.  See above.  */
 873   max_uid_for_loop = get_max_uid ();
 874
 875   /* find_and_verify_loops has already called compute_luids, but it
 876      might have rearranged code afterwards, so we need to recompute
 877      the luids now.  */
 878   compute_luids (f, NULL_RTX, 0);
 879
 880   /* Don't leave gaps in uid_luid for insns that have been
 881      deleted.  It is possible that the first or last insn
 882      using some register has been deleted by cross-jumping.
 883      Make sure that uid_luid for that former insn's uid
 884      points to the general area where that insn used to be.  */
 885   for (i = 0; i < max_uid_for_loop; i++)
 886     {
 887       uid_luid[0] = uid_luid[i];
 888       if (uid_luid[0] != 0)
 889         break;
 890     }
 891   for (i = 0; i < max_uid_for_loop; i++)
 892     if (uid_luid[i] == 0)
 893       uid_luid[i] = uid_luid[i - 1];
 894
 895   /* Determine if the function has indirect jump.  On some systems
 896      this prevents low overhead loop instructions from being used.  */
 897   indirect_jump_in_function = indirect_jump_in_function_p (f);
 898
 899   /* Now scan the loops, last ones first, since this means inner ones are done
 900      before outer ones.  */
 901   for (i = max_loop_num - 1; i >= 0; i--)
 902     {
 903       struct loop *loop = &loops->array[i];
 904
 905       if (! loop->invalid && loop->end)
 906         {
 907           scan_loop (loop, flags);
 908           ggc_collect ();
 909         }
 910     }
 911
 912   end_alias_analysis ();
 913
 914   /* Clean up.  */
 915   for (i = 0; i < (int) loops->num; i++)
 916     free (loops_info[i].mems);
 917
 918   free (uid_luid);
 919   free (uid_loop);
 920   free (loops_info);
 921   free (loops->array);
 922 }
 923 \f
 924 /* Returns the next insn, in execution order, after INSN.  START and
 925    END are the NOTE_INSN_LOOP_BEG and NOTE_INSN_LOOP_END for the loop,
 926    respectively.  LOOP->TOP, if non-NULL, is the top of the loop in the
 927    insn-stream; it is used with loops that are entered near the
 928    bottom.  */
 929
 930 static rtx
 931 next_insn_in_loop (const struct loop *loop, rtx insn)
 932 {
 933   insn = NEXT_INSN (insn);
 934
 935   if (insn == loop->end)
 936     {
 937       if (loop->top)
 938         /* Go to the top of the loop, and continue there.  */
 939         insn = loop->top;
 940       else
 941         /* We're done.  */
 942         insn = NULL_RTX;
 943     }
 944
 945   if (insn == loop->scan_start)
 946     /* We're done.  */
 947     insn = NULL_RTX;
 948
 949   return insn;
 950 }
 951
 952 /* Find any register references hidden inside X and add them to
 953    the dependency list DEPS.  This is used to look inside CLOBBER (MEM
 954    when checking whether a PARALLEL can be pulled out of a loop.  */
 955
 956 static rtx
 957 find_regs_nested (rtx deps, rtx x)
 958 {
 959   enum rtx_code code = GET_CODE (x);
 960   if (code == REG)
 961     deps = gen_rtx_EXPR_LIST (VOIDmode, x, deps);
 962   else
 963     {
 964       const char *fmt = GET_RTX_FORMAT (code);
 965       int i, j;
 966       for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
 967         {
 968           if (fmt[i] == 'e')
 969             deps = find_regs_nested (deps, XEXP (x, i));
 970           else if (fmt[i] == 'E')
 971             for (j = 0; j < XVECLEN (x, i); j++)
 972               deps = find_regs_nested (deps, XVECEXP (x, i, j));
 973         }
 974     }
 975   return deps;
 976 }
 977
 978 /* Optimize one loop described by LOOP.  */
 979
 980 /* ??? Could also move memory writes out of loops if the destination address
 981    is invariant, the source is invariant, the memory write is not volatile,
 982    and if we can prove that no read inside the loop can read this address
 983    before the write occurs.  If there is a read of this address after the
 984    write, then we can also mark the memory read as invariant.  */
 985
 986 static void
 987 scan_loop (struct loop *loop, int flags)
 988 {
 989   struct loop_info *loop_info = LOOP_INFO (loop);
 990   struct loop_regs *regs = LOOP_REGS (loop);
 991   int i;
 992   rtx loop_start = loop->start;
 993   rtx loop_end = loop->end;
 994   rtx p;
 995   /* 1 if we are scanning insns that could be executed zero times.  */
 996   int maybe_never = 0;
 997   /* 1 if we are scanning insns that might never be executed
 998      due to a subroutine call which might exit before they are reached.  */
 999   int call_passed = 0;
1000   /* Number of insns in the loop.  */
1001   int insn_count;
1002   int tem;
1003   rtx temp, update_start, update_end;
1004   /* The SET from an insn, if it is the only SET in the insn.  */
1005   rtx set, set1;
1006   /* Chain describing insns movable in current loop.  */
1007   struct loop_movables *movables = LOOP_MOVABLES (loop);
1008   /* Ratio of extra register life span we can justify
1009      for saving an instruction.  More if loop doesn't call subroutines
1010      since in that case saving an insn makes more difference
1011      and more registers are available.  */
1012   int threshold;
1013   int in_libcall;
1014
1015   loop->top = 0;
1016
1017   movables->head = 0;
1018   movables->last = 0;
1019
1020   /* Determine whether this loop starts with a jump down to a test at
1021      the end.  This will occur for a small number of loops with a test
1022      that is too complex to duplicate in front of the loop.
1023
1024      We search for the first insn or label in the loop, skipping NOTEs.
1025      However, we must be careful not to skip past a NOTE_INSN_LOOP_BEG
1026      (because we might have a loop executed only once that contains a
1027      loop which starts with a jump to its exit test) or a NOTE_INSN_LOOP_END
1028      (in case we have a degenerate loop).
1029
1030      Note that if we mistakenly think that a loop is entered at the top
1031      when, in fact, it is entered at the exit test, the only effect will be
1032      slightly poorer optimization.  Making the opposite error can generate
1033      incorrect code.  Since very few loops now start with a jump to the
1034      exit test, the code here to detect that case is very conservative.  */
1035
1036   for (p = NEXT_INSN (loop_start);
1037        p != loop_end
1038          && !LABEL_P (p) && ! INSN_P (p)
1039          && (!NOTE_P (p)
1040              || (NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_BEG
1041                  && NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_END));
1042        p = NEXT_INSN (p))
1043     ;
1044
1045   loop->scan_start = p;
1046
1047   /* If loop end is the end of the current function, then emit a
1048      NOTE_INSN_DELETED after loop_end and set loop->sink to the dummy
1049      note insn.  This is the position we use when sinking insns out of
1050      the loop.  */
1051   if (NEXT_INSN (loop->end) != 0)
1052     loop->sink = NEXT_INSN (loop->end);
1053   else
1054     loop->sink = emit_note_after (NOTE_INSN_DELETED, loop->end);
1055
1056   /* Set up variables describing this loop.  */
1057   prescan_loop (loop);
1058   threshold = (loop_info->has_call ? 1 : 2) * (1 + n_non_fixed_regs);
1059
1060   /* If loop has a jump before the first label,
1061      the true entry is the target of that jump.
1062      Start scan from there.
1063      But record in LOOP->TOP the place where the end-test jumps
1064      back to so we can scan that after the end of the loop.  */
1065   if (JUMP_P (p)
1066       /* Loop entry must be unconditional jump (and not a RETURN)  */
1067       && any_uncondjump_p (p)
1068       && JUMP_LABEL (p) != 0
1069       /* Check to see whether the jump actually
1070          jumps out of the loop (meaning it's no loop).
1071          This case can happen for things like
1072          do {..} while (0).  If this label was generated previously
1073          by loop, we can't tell anything about it and have to reject
1074          the loop.  */
1075       && INSN_IN_RANGE_P (JUMP_LABEL (p), loop_start, loop_end))
1076     {
1077       loop->top = next_label (loop->scan_start);
1078       loop->scan_start = JUMP_LABEL (p);
1079     }
1080
1081   /* If LOOP->SCAN_START was an insn created by loop, we don't know its luid
1082      as required by loop_reg_used_before_p.  So skip such loops.  (This
1083      test may never be true, but it's best to play it safe.)
1084
1085      Also, skip loops where we do not start scanning at a label.  This
1086      test also rejects loops starting with a JUMP_INSN that failed the
1087      test above.  */
1088
1089   if (INSN_UID (loop->scan_start) >= max_uid_for_loop
1090       || !LABEL_P (loop->scan_start))
1091     {
1092       if (loop_dump_stream)
1093         fprintf (loop_dump_stream, "\nLoop from %d to %d is phony.\n\n",
1094                  INSN_UID (loop_start), INSN_UID (loop_end));
1095       return;
1096     }
1097
1098   /* Allocate extra space for REGs that might be created by load_mems.
1099      We allocate a little extra slop as well, in the hopes that we
1100      won't have to reallocate the regs array.  */
1101   loop_regs_scan (loop, loop_info->mems_idx + 16);
1102   insn_count = count_insns_in_loop (loop);
1103
1104   if (loop_dump_stream)
1105     fprintf (loop_dump_stream, "\nLoop from %d to %d: %d real insns.\n",
1106              INSN_UID (loop_start), INSN_UID (loop_end), insn_count);
1107
1108   /* Scan through the loop finding insns that are safe to move.
1109      Set REGS->ARRAY[I].SET_IN_LOOP negative for the reg I being set, so that
1110      this reg will be considered invariant for subsequent insns.
1111      We consider whether subsequent insns use the reg
1112      in deciding whether it is worth actually moving.
1113
1114      MAYBE_NEVER is nonzero if we have passed a conditional jump insn
1115      and therefore it is possible that the insns we are scanning
1116      would never be executed.  At such times, we must make sure
1117      that it is safe to execute the insn once instead of zero times.
1118      When MAYBE_NEVER is 0, all insns will be executed at least once
1119      so that is not a problem.  */
1120
1121   for (in_libcall = 0, p = next_insn_in_loop (loop, loop->scan_start);
1122        p != NULL_RTX;
1123        p = next_insn_in_loop (loop, p))
1124     {
1125       if (in_libcall && INSN_P (p) && find_reg_note (p, REG_RETVAL, NULL_RTX))
1126         in_libcall--;
1127       if (NONJUMP_INSN_P (p))
1128         {
1129           /* Do not scan past an optimization barrier.  */
1130           if (GET_CODE (PATTERN (p)) == ASM_INPUT)
1131             break;
1132           temp = find_reg_note (p, REG_LIBCALL, NULL_RTX);
1133           if (temp)
1134             in_libcall++;
1135           if (! in_libcall
1136               && (set = single_set (p))
1137               && REG_P (SET_DEST (set))
1138 #ifdef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED
1139               && SET_DEST (set) != pic_offset_table_rtx
1140 #endif
1141               && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
1142             {
1143               int tem1 = 0;
1144               int tem2 = 0;
1145               int move_insn = 0;
1146               int insert_temp = 0;
1147               rtx src = SET_SRC (set);
1148               rtx dependencies = 0;
1149
1150               /* Figure out what to use as a source of this insn.  If a
1151                  REG_EQUIV note is given or if a REG_EQUAL note with a
1152                  constant operand is specified, use it as the source and
1153                  mark that we should move this insn by calling
1154                  emit_move_insn rather that duplicating the insn.
1155
1156                  Otherwise, only use the REG_EQUAL contents if a REG_RETVAL
1157                  note is present.  */
1158               temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
1159               if (temp)
1160                 src = XEXP (temp, 0), move_insn = 1;
1161               else
1162                 {
1163                   temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
1164                   if (temp && CONSTANT_P (XEXP (temp, 0)))
1165                     src = XEXP (temp, 0), move_insn = 1;
1166                   if (temp && find_reg_note (p, REG_RETVAL, NULL_RTX))
1167                     {
1168                       src = XEXP (temp, 0);
1169                       /* A libcall block can use regs that don't appear in
1170                          the equivalent expression.  To move the libcall,
1171                          we must move those regs too.  */
1172                       dependencies = libcall_other_reg (p, src);
1173                     }
1174                 }
1175
1176               /* For parallels, add any possible uses to the dependencies, as
1177                  we can't move the insn without resolving them first.
1178                  MEMs inside CLOBBERs may also reference registers; these
1179                  count as implicit uses.  */
1180               if (GET_CODE (PATTERN (p)) == PARALLEL)
1181                 {
1182                   for (i = 0; i < XVECLEN (PATTERN (p), 0); i++)
1183                     {
1184                       rtx x = XVECEXP (PATTERN (p), 0, i);
1185                       if (GET_CODE (x) == USE)
1186                         dependencies
1187                           = gen_rtx_EXPR_LIST (VOIDmode, XEXP (x, 0),
1188                                                dependencies);
1189                       else if (GET_CODE (x) == CLOBBER
1190                                && MEM_P (XEXP (x, 0)))
1191                         dependencies = find_regs_nested (dependencies,
1192                                                   XEXP (XEXP (x, 0), 0));
1193                     }
1194                 }
1195
1196               if (/* The register is used in basic blocks other
1197                       than the one where it is set (meaning that
1198                       something after this point in the loop might
1199                       depend on its value before the set).  */
1200                    ! reg_in_basic_block_p (p, SET_DEST (set))
1201                    /* And the set is not guaranteed to be executed once
1202                       the loop starts, or the value before the set is
1203                       needed before the set occurs...
1204
1205                       ??? Note we have quadratic behavior here, mitigated
1206                       by the fact that the previous test will often fail for
1207                       large loops.  Rather than re-scanning the entire loop
1208                       each time for register usage, we should build tables
1209                       of the register usage and use them here instead.  */
1210                    && (maybe_never
1211                        || loop_reg_used_before_p (loop, set, p)))
1212                 /* It is unsafe to move the set.  However, it may be OK to
1213                    move the source into a new pseudo, and substitute a
1214                    reg-to-reg copy for the original insn.
1215
1216                    This code used to consider it OK to move a set of a variable
1217                    which was not created by the user and not used in an exit
1218                    test.
1219                    That behavior is incorrect and was removed.  */
1220                 insert_temp = 1;
1221
1222               /* Don't try to optimize a MODE_CC set with a constant
1223                  source.  It probably will be combined with a conditional
1224                  jump.  */
1225               if (GET_MODE_CLASS (GET_MODE (SET_DEST (set))) == MODE_CC
1226                   && CONSTANT_P (src))
1227                 ;
1228               /* Don't try to optimize a register that was made
1229                  by loop-optimization for an inner loop.
1230                  We don't know its life-span, so we can't compute
1231                  the benefit.  */
1232               else if (REGNO (SET_DEST (set)) >= max_reg_before_loop)
1233                 ;
1234               /* Don't move the source and add a reg-to-reg copy:
1235                  - with -Os (this certainly increases size),
1236                  - if the mode doesn't support copy operations (obviously),
1237                  - if the source is already a reg (the motion will gain nothing),
1238                  - if the source is a legitimate constant (likewise).  */
1239               else if (insert_temp
1240                        && (optimize_size
1241                            || ! can_copy_p (GET_MODE (SET_SRC (set)))
1242                            || REG_P (SET_SRC (set))
1243                            || (CONSTANT_P (SET_SRC (set))
1244                                && LEGITIMATE_CONSTANT_P (SET_SRC (set)))))
1245                 ;
1246               else if ((tem = loop_invariant_p (loop, src))
1247                        && (dependencies == 0
1248                            || (tem2
1249                                = loop_invariant_p (loop, dependencies)) != 0)
1250                        && (regs->array[REGNO (SET_DEST (set))].set_in_loop == 1
1251                            || (tem1
1252                                = consec_sets_invariant_p
1253                                (loop, SET_DEST (set),
1254                                 regs->array[REGNO (SET_DEST (set))].set_in_loop,
1255                                 p)))
1256                        /* If the insn can cause a trap (such as divide by zero),
1257                           can't move it unless it's guaranteed to be executed
1258                           once loop is entered.  Even a function call might
1259                           prevent the trap insn from being reached
1260                           (since it might exit!)  */
1261                        && ! ((maybe_never || call_passed)
1262                              && may_trap_p (src)))
1263                 {
1264                   struct movable *m;
1265                   int regno = REGNO (SET_DEST (set));
1266
1267                   /* A potential lossage is where we have a case where two insns
1268                      can be combined as long as they are both in the loop, but
1269                      we move one of them outside the loop.  For large loops,
1270                      this can lose.  The most common case of this is the address
1271                      of a function being called.
1272
1273                      Therefore, if this register is marked as being used
1274                      exactly once if we are in a loop with calls
1275                      (a "large loop"), see if we can replace the usage of
1276                      this register with the source of this SET.  If we can,
1277                      delete this insn.
1278
1279                      Don't do this if P has a REG_RETVAL note or if we have
1280                      SMALL_REGISTER_CLASSES and SET_SRC is a hard register.  */
1281
1282                   if (loop_info->has_call
1283                       && regs->array[regno].single_usage != 0
1284                       && regs->array[regno].single_usage != const0_rtx
1285                       && REGNO_FIRST_UID (regno) == INSN_UID (p)
1286                       && (REGNO_LAST_UID (regno)
1287                           == INSN_UID (regs->array[regno].single_usage))
1288                       && regs->array[regno].set_in_loop == 1
1289                       && GET_CODE (SET_SRC (set)) != ASM_OPERANDS
1290                       && ! side_effects_p (SET_SRC (set))
1291                       && ! find_reg_note (p, REG_RETVAL, NULL_RTX)
1292                       && (! SMALL_REGISTER_CLASSES
1293                           || (! (REG_P (SET_SRC (set))
1294                                  && (REGNO (SET_SRC (set))
1295                                      < FIRST_PSEUDO_REGISTER))))
1296                       && regno >= FIRST_PSEUDO_REGISTER
1297                       /* This test is not redundant; SET_SRC (set) might be
1298                          a call-clobbered register and the life of REGNO
1299                          might span a call.  */
1300                       && ! modified_between_p (SET_SRC (set), p,
1301                                                regs->array[regno].single_usage)
1302                       && no_labels_between_p (p,
1303                                               regs->array[regno].single_usage)
1304                       && validate_replace_rtx (SET_DEST (set), SET_SRC (set),
1305                                                regs->array[regno].single_usage))
1306                     {
1307                       /* Replace any usage in a REG_EQUAL note.  Must copy
1308                          the new source, so that we don't get rtx sharing
1309                          between the SET_SOURCE and REG_NOTES of insn p.  */
1310                       REG_NOTES (regs->array[regno].single_usage)
1311                         = (replace_rtx
1312                            (REG_NOTES (regs->array[regno].single_usage),
1313                             SET_DEST (set), copy_rtx (SET_SRC (set))));
1314
1315                       delete_insn (p);
1316                       for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
1317                            i++)
1318                         regs->array[regno+i].set_in_loop = 0;
1319                       continue;
1320                     }
1321
1322                   m = xmalloc (sizeof (struct movable));
1323                   m->next = 0;
1324                   m->insn = p;
1325                   m->set_src = src;
1326                   m->dependencies = dependencies;
1327                   m->set_dest = SET_DEST (set);
1328                   m->force = 0;
1329                   m->consec
1330                     = regs->array[REGNO (SET_DEST (set))].set_in_loop - 1;
1331                   m->done = 0;
1332                   m->forces = 0;
1333                   m->partial = 0;
1334                   m->move_insn = move_insn;
1335                   m->move_insn_first = 0;
1336                   m->insert_temp = insert_temp;
1337                   m->is_equiv = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
1338                   m->savemode = VOIDmode;
1339                   m->regno = regno;
1340                   /* Set M->cond if either loop_invariant_p
1341                      or consec_sets_invariant_p returned 2
1342                      (only conditionally invariant).  */
1343                   m->cond = ((tem | tem1 | tem2) > 1);
1344                   m->global =  LOOP_REG_GLOBAL_P (loop, regno);
1345                   m->match = 0;
1346                   m->lifetime = LOOP_REG_LIFETIME (loop, regno);
1347                   m->savings = regs->array[regno].n_times_set;
1348                   if (find_reg_note (p, REG_RETVAL, NULL_RTX))
1349                     m->savings += libcall_benefit (p);
1350                   for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
1351                     regs->array[regno+i].set_in_loop = move_insn ? -2 : -1;
1352                   /* Add M to the end of the chain MOVABLES.  */
1353                   loop_movables_add (movables, m);
1354
1355                   if (m->consec > 0)
1356                     {
1357                       /* It is possible for the first instruction to have a
1358                          REG_EQUAL note but a non-invariant SET_SRC, so we must
1359                          remember the status of the first instruction in case
1360                          the last instruction doesn't have a REG_EQUAL note.  */
1361                       m->move_insn_first = m->move_insn;
1362
1363                       /* Skip this insn, not checking REG_LIBCALL notes.  */
1364                       p = next_nonnote_insn (p);
1365                       /* Skip the consecutive insns, if there are any.  */
1366                       p = skip_consec_insns (p, m->consec);
1367                       /* Back up to the last insn of the consecutive group.  */
1368                       p = prev_nonnote_insn (p);
1369
1370                       /* We must now reset m->move_insn, m->is_equiv, and
1371                          possibly m->set_src to correspond to the effects of
1372                          all the insns.  */
1373                       temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
1374                       if (temp)
1375                         m->set_src = XEXP (temp, 0), m->move_insn = 1;
1376                       else
1377                         {
1378                           temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
1379                           if (temp && CONSTANT_P (XEXP (temp, 0)))
1380                             m->set_src = XEXP (temp, 0), m->move_insn = 1;
1381                           else
1382                             m->move_insn = 0;
1383
1384                         }
1385                       m->is_equiv
1386                         = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
1387                     }
1388                 }
1389               /* If this register is always set within a STRICT_LOW_PART
1390                  or set to zero, then its high bytes are constant.
1391                  So clear them outside the loop and within the loop
1392                  just load the low bytes.
1393                  We must check that the machine has an instruction to do so.
1394                  Also, if the value loaded into the register
1395                  depends on the same register, this cannot be done.  */
1396               else if (SET_SRC (set) == const0_rtx
1397                        && NONJUMP_INSN_P (NEXT_INSN (p))
1398                        && (set1 = single_set (NEXT_INSN (p)))
1399                        && GET_CODE (set1) == SET
1400                        && (GET_CODE (SET_DEST (set1)) == STRICT_LOW_PART)
1401                        && (GET_CODE (XEXP (SET_DEST (set1), 0)) == SUBREG)
1402                        && (SUBREG_REG (XEXP (SET_DEST (set1), 0))
1403                            == SET_DEST (set))
1404                        && !reg_mentioned_p (SET_DEST (set), SET_SRC (set1)))
1405                 {
1406                   int regno = REGNO (SET_DEST (set));
1407                   if (regs->array[regno].set_in_loop == 2)
1408                     {
1409                       struct movable *m;
1410                       m = xmalloc (sizeof (struct movable));
1411                       m->next = 0;
1412                       m->insn = p;
1413                       m->set_dest = SET_DEST (set);
1414                       m->dependencies = 0;
1415                       m->force = 0;
1416                       m->consec = 0;
1417                       m->done = 0;
1418                       m->forces = 0;
1419                       m->move_insn = 0;
1420                       m->move_insn_first = 0;
1421                       m->insert_temp = insert_temp;
1422                       m->partial = 1;
1423                       /* If the insn may not be executed on some cycles,
1424                          we can't clear the whole reg; clear just high part.
1425                          Not even if the reg is used only within this loop.
1426                          Consider this:
1427                          while (1)
1428                            while (s != t) {
1429                              if (foo ()) x = *s;
1430                              use (x);
1431                            }
1432                          Clearing x before the inner loop could clobber a value
1433                          being saved from the last time around the outer loop.
1434                          However, if the reg is not used outside this loop
1435                          and all uses of the register are in the same
1436                          basic block as the store, there is no problem.
1437
1438                          If this insn was made by loop, we don't know its
1439                          INSN_LUID and hence must make a conservative
1440                          assumption.  */
1441                       m->global = (INSN_UID (p) >= max_uid_for_loop
1442                                    || LOOP_REG_GLOBAL_P (loop, regno)
1443                                    || (labels_in_range_p
1444                                        (p, REGNO_FIRST_LUID (regno))));
1445                       if (maybe_never && m->global)
1446                         m->savemode = GET_MODE (SET_SRC (set1));
1447                       else
1448                         m->savemode = VOIDmode;
1449                       m->regno = regno;
1450                       m->cond = 0;
1451                       m->match = 0;
1452                       m->lifetime = LOOP_REG_LIFETIME (loop, regno);
1453                       m->savings = 1;
1454                       for (i = 0;
1455                            i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
1456                            i++)
1457                         regs->array[regno+i].set_in_loop = -1;
1458                       /* Add M to the end of the chain MOVABLES.  */
1459                       loop_movables_add (movables, m);
1460                     }
1461                 }
1462             }
1463         }
1464       /* Past a call insn, we get to insns which might not be executed
1465          because the call might exit.  This matters for insns that trap.
1466          Constant and pure call insns always return, so they don't count.  */
1467       else if (CALL_P (p) && ! CONST_OR_PURE_CALL_P (p))
1468         call_passed = 1;
1469       /* Past a label or a jump, we get to insns for which we
1470          can't count on whether or how many times they will be
1471          executed during each iteration.  Therefore, we can
1472          only move out sets of trivial variables
1473          (those not used after the loop).  */
1474       /* Similar code appears twice in strength_reduce.  */
1475       else if ((LABEL_P (p) || JUMP_P (p))
1476                /* If we enter the loop in the middle, and scan around to the
1477                   beginning, don't set maybe_never for that.  This must be an
1478                   unconditional jump, otherwise the code at the top of the
1479                   loop might never be executed.  Unconditional jumps are
1480                   followed by a barrier then the loop_end.  */
1481                && ! (JUMP_P (p) && JUMP_LABEL (p) == loop->top
1482                      && NEXT_INSN (NEXT_INSN (p)) == loop_end
1483                      && any_uncondjump_p (p)))
1484         maybe_never = 1;
1485     }
1486
1487   /* If one movable subsumes another, ignore that other.  */
1488
1489   ignore_some_movables (movables);
1490
1491   /* For each movable insn, see if the reg that it loads
1492      leads when it dies right into another conditionally movable insn.
1493      If so, record that the second insn "forces" the first one,
1494      since the second can be moved only if the first is.  */
1495
1496   force_movables (movables);
1497
1498   /* See if there are multiple movable insns that load the same value.
1499      If there are, make all but the first point at the first one
1500      through the `match' field, and add the priorities of them
1501      all together as the priority of the first.  */
1502
1503   combine_movables (movables, regs);
1504
1505   /* Now consider each movable insn to decide whether it is worth moving.
1506      Store 0 in regs->array[I].set_in_loop for each reg I that is moved.
1507
1508      For machines with few registers this increases code size, so do not
1509      move moveables when optimizing for code size on such machines.
1510      (The 18 below is the value for i386.)  */
1511
1512   if (!optimize_size
1513       || (reg_class_size[GENERAL_REGS] > 18 && !loop_info->has_call))
1514     {
1515       move_movables (loop, movables, threshold, insn_count);
1516
1517       /* Recalculate regs->array if move_movables has created new
1518          registers.  */
1519       if (max_reg_num () > regs->num)
1520         {
1521           loop_regs_scan (loop, 0);
1522           for (update_start = loop_start;
1523                PREV_INSN (update_start)
1524                && !LABEL_P (PREV_INSN (update_start));
1525                update_start = PREV_INSN (update_start))
1526             ;
1527           update_end = NEXT_INSN (loop_end);
1528
1529           reg_scan_update (update_start, update_end, loop_max_reg);
1530           loop_max_reg = max_reg_num ();
1531         }
1532     }
1533
1534   /* Now candidates that still are negative are those not moved.
1535      Change regs->array[I].set_in_loop to indicate that those are not actually
1536      invariant.  */
1537   for (i = 0; i < regs->num; i++)
1538     if (regs->array[i].set_in_loop < 0)
1539       regs->array[i].set_in_loop = regs->array[i].n_times_set;
1540
1541   /* Now that we've moved some things out of the loop, we might be able to
1542      hoist even more memory references.  */
1543   load_mems (loop);
1544
1545   /* Recalculate regs->array if load_mems has created new registers.  */
1546   if (max_reg_num () > regs->num)
1547     loop_regs_scan (loop, 0);
1548
1549   for (update_start = loop_start;
1550        PREV_INSN (update_start)
1551          && !LABEL_P (PREV_INSN (update_start));
1552        update_start = PREV_INSN (update_start))
1553     ;
1554   update_end = NEXT_INSN (loop_end);
1555
1556   reg_scan_update (update_start, update_end, loop_max_reg);
1557   loop_max_reg = max_reg_num ();
1558
1559   if (flag_strength_reduce)
1560     {
1561       if (update_end && LABEL_P (update_end))
1562         /* Ensure our label doesn't go away.  */
1563         LABEL_NUSES (update_end)++;
1564
1565       strength_reduce (loop, flags);
1566
1567       reg_scan_update (update_start, update_end, loop_max_reg);
1568       loop_max_reg = max_reg_num ();
1569
1570       if (update_end && LABEL_P (update_end)
1571           && --LABEL_NUSES (update_end) == 0)
1572         delete_related_insns (update_end);
1573     }
1574
1575
1576   /* The movable information is required for strength reduction.  */
1577   loop_movables_free (movables);
1578
1579   free (regs->array);
1580   regs->array = 0;
1581   regs->num = 0;
1582 }
1583 \f
1584 /* Add elements to *OUTPUT to record all the pseudo-regs
1585    mentioned in IN_THIS but not mentioned in NOT_IN_THIS.  */
1586
1587 static void
1588 record_excess_regs (rtx in_this, rtx not_in_this, rtx *output)
1589 {
1590   enum rtx_code code;
1591   const char *fmt;
1592   int i;
1593
1594   code = GET_CODE (in_this);
1595
1596   switch (code)
1597     {
1598     case PC:
1599     case CC0:
1600     case CONST_INT:
1601     case CONST_DOUBLE:
1602     case CONST:
1603     case SYMBOL_REF:
1604     case LABEL_REF:
1605       return;
1606
1607     case REG:
1608       if (REGNO (in_this) >= FIRST_PSEUDO_REGISTER
1609           && ! reg_mentioned_p (in_this, not_in_this))
1610         *output = gen_rtx_EXPR_LIST (VOIDmode, in_this, *output);
1611       return;
1612
1613     default:
1614       break;
1615     }
1616
1617   fmt = GET_RTX_FORMAT (code);
1618   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1619     {
1620       int j;
1621
1622       switch (fmt[i])
1623         {
1624         case 'E':
1625           for (j = 0; j < XVECLEN (in_this, i); j++)
1626             record_excess_regs (XVECEXP (in_this, i, j), not_in_this, output);
1627           break;
1628
1629         case 'e':
1630           record_excess_regs (XEXP (in_this, i), not_in_this, output);
1631           break;
1632         }
1633     }
1634 }
1635 \f
1636 /* Check what regs are referred to in the libcall block ending with INSN,
1637    aside from those mentioned in the equivalent value.
1638    If there are none, return 0.
1639    If there are one or more, return an EXPR_LIST containing all of them.  */
1640
1641 static rtx
1642 libcall_other_reg (rtx insn, rtx equiv)
1643 {
1644   rtx note = find_reg_note (insn, REG_RETVAL, NULL_RTX);
1645   rtx p = XEXP (note, 0);
1646   rtx output = 0;
1647
1648   /* First, find all the regs used in the libcall block
1649      that are not mentioned as inputs to the result.  */
1650
1651   while (p != insn)
1652     {
1653       if (INSN_P (p))
1654         record_excess_regs (PATTERN (p), equiv, &output);
1655       p = NEXT_INSN (p);
1656     }
1657
1658   return output;
1659 }
1660 \f
1661 /* Return 1 if all uses of REG
1662    are between INSN and the end of the basic block.  */
1663
1664 static int
1665 reg_in_basic_block_p (rtx insn, rtx reg)
1666 {
1667   int regno = REGNO (reg);
1668   rtx p;
1669
1670   if (REGNO_FIRST_UID (regno) != INSN_UID (insn))
1671     return 0;
1672
1673   /* Search this basic block for the already recorded last use of the reg.  */
1674   for (p = insn; p; p = NEXT_INSN (p))
1675     {
1676       switch (GET_CODE (p))
1677         {
1678         case NOTE:
1679           break;
1680
1681         case INSN:
1682         case CALL_INSN:
1683           /* Ordinary insn: if this is the last use, we win.  */
1684           if (REGNO_LAST_UID (regno) == INSN_UID (p))
1685             return 1;
1686           break;
1687
1688         case JUMP_INSN:
1689           /* Jump insn: if this is the last use, we win.  */
1690           if (REGNO_LAST_UID (regno) == INSN_UID (p))
1691             return 1;
1692           /* Otherwise, it's the end of the basic block, so we lose.  */
1693           return 0;
1694
1695         case CODE_LABEL:
1696         case BARRIER:
1697           /* It's the end of the basic block, so we lose.  */
1698           return 0;
1699
1700         default:
1701           break;
1702         }
1703     }
1704
1705   /* The "last use" that was recorded can't be found after the first
1706      use.  This can happen when the last use was deleted while
1707      processing an inner loop, this inner loop was then completely
1708      unrolled, and the outer loop is always exited after the inner loop,
1709      so that everything after the first use becomes a single basic block.  */
1710   return 1;
1711 }
1712 \f
1713 /* Compute the benefit of eliminating the insns in the block whose
1714    last insn is LAST.  This may be a group of insns used to compute a
1715    value directly or can contain a library call.  */
1716
1717 static int
1718 libcall_benefit (rtx last)
1719 {
1720   rtx insn;
1721   int benefit = 0;
1722
1723   for (insn = XEXP (find_reg_note (last, REG_RETVAL, NULL_RTX), 0);
1724        insn != last; insn = NEXT_INSN (insn))
1725     {
1726       if (CALL_P (insn))
1727         benefit += 10;          /* Assume at least this many insns in a library
1728                                    routine.  */
1729       else if (NONJUMP_INSN_P (insn)
1730                && GET_CODE (PATTERN (insn)) != USE
1731                && GET_CODE (PATTERN (insn)) != CLOBBER)
1732         benefit++;
1733     }
1734
1735   return benefit;
1736 }
1737 \f
1738 /* Skip COUNT insns from INSN, counting library calls as 1 insn.  */
1739
1740 static rtx
1741 skip_consec_insns (rtx insn, int count)
1742 {
1743   for (; count > 0; count--)
1744     {
1745       rtx temp;
1746
1747       /* If first insn of libcall sequence, skip to end.  */
1748       /* Do this at start of loop, since INSN is guaranteed to
1749          be an insn here.  */
1750       if (!NOTE_P (insn)
1751           && (temp = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
1752         insn = XEXP (temp, 0);
1753
1754       do
1755         insn = NEXT_INSN (insn);
1756       while (NOTE_P (insn));
1757     }
1758
1759   return insn;
1760 }
1761
1762 /* Ignore any movable whose insn falls within a libcall
1763    which is part of another movable.
1764    We make use of the fact that the movable for the libcall value
1765    was made later and so appears later on the chain.  */
1766
1767 static void
1768 ignore_some_movables (struct loop_movables *movables)
1769 {
1770   struct movable *m, *m1;
1771
1772   for (m = movables->head; m; m = m->next)
1773     {
1774       /* Is this a movable for the value of a libcall?  */
1775       rtx note = find_reg_note (m->insn, REG_RETVAL, NULL_RTX);
1776       if (note)
1777         {
1778           rtx insn;
1779           /* Check for earlier movables inside that range,
1780              and mark them invalid.  We cannot use LUIDs here because
1781              insns created by loop.c for prior loops don't have LUIDs.
1782              Rather than reject all such insns from movables, we just
1783              explicitly check each insn in the libcall (since invariant
1784              libcalls aren't that common).  */
1785           for (insn = XEXP (note, 0); insn != m->insn; insn = NEXT_INSN (insn))
1786             for (m1 = movables->head; m1 != m; m1 = m1->next)
1787               if (m1->insn == insn)
1788                 m1->done = 1;
1789         }
1790     }
1791 }
1792
1793 /* For each movable insn, see if the reg that it loads
1794    leads when it dies right into another conditionally movable insn.
1795    If so, record that the second insn "forces" the first one,
1796    since the second can be moved only if the first is.  */
1797
1798 static void
1799 force_movables (struct loop_movables *movables)
1800 {
1801   struct movable *m, *m1;
1802
1803   for (m1 = movables->head; m1; m1 = m1->next)
1804     /* Omit this if moving just the (SET (REG) 0) of a zero-extend.  */
1805     if (!m1->partial && !m1->done)
1806       {
1807         int regno = m1->regno;
1808         for (m = m1->next; m; m = m->next)
1809           /* ??? Could this be a bug?  What if CSE caused the
1810              register of M1 to be used after this insn?
1811              Since CSE does not update regno_last_uid,
1812              this insn M->insn might not be where it dies.
1813              But very likely this doesn't matter; what matters is
1814              that M's reg is computed from M1's reg.  */
1815           if (INSN_UID (m->insn) == REGNO_LAST_UID (regno)
1816               && !m->done)
1817             break;
1818         if (m != 0 && m->set_src == m1->set_dest
1819             /* If m->consec, m->set_src isn't valid.  */
1820             && m->consec == 0)
1821           m = 0;
1822
1823         /* Increase the priority of the moving the first insn
1824            since it permits the second to be moved as well.
1825            Likewise for insns already forced by the first insn.  */
1826         if (m != 0)
1827           {
1828             struct movable *m2;
1829
1830             m->forces = m1;
1831             for (m2 = m1; m2; m2 = m2->forces)
1832               {
1833                 m2->lifetime += m->lifetime;
1834                 m2->savings += m->savings;
1835               }
1836           }
1837       }
1838 }
1839 \f
1840 /* Find invariant expressions that are equal and can be combined into
1841    one register.  */
1842
1843 static void
1844 combine_movables (struct loop_movables *movables, struct loop_regs *regs)
1845 {
1846   struct movable *m;
1847   char *matched_regs = xmalloc (regs->num);
1848   enum machine_mode mode;
1849
1850   /* Regs that are set more than once are not allowed to match
1851      or be matched.  I'm no longer sure why not.  */
1852   /* Only pseudo registers are allowed to match or be matched,
1853      since move_movables does not validate the change.  */
1854   /* Perhaps testing m->consec_sets would be more appropriate here?  */
1855
1856   for (m = movables->head; m; m = m->next)
1857     if (m->match == 0 && regs->array[m->regno].n_times_set == 1
1858         && m->regno >= FIRST_PSEUDO_REGISTER
1859         && !m->insert_temp
1860         && !m->partial)
1861       {
1862         struct movable *m1;
1863         int regno = m->regno;
1864
1865         memset (matched_regs, 0, regs->num);
1866         matched_regs[regno] = 1;
1867
1868         /* We want later insns to match the first one.  Don't make the first
1869            one match any later ones.  So start this loop at m->next.  */
1870         for (m1 = m->next; m1; m1 = m1->next)
1871           if (m != m1 && m1->match == 0
1872               && !m1->insert_temp
1873               && regs->array[m1->regno].n_times_set == 1
1874               && m1->regno >= FIRST_PSEUDO_REGISTER
1875               /* A reg used outside the loop mustn't be eliminated.  */
1876               && !m1->global
1877               /* A reg used for zero-extending mustn't be eliminated.  */
1878               && !m1->partial
1879               && (matched_regs[m1->regno]
1880                   ||
1881                   (
1882                    /* Can combine regs with different modes loaded from the
1883                       same constant only if the modes are the same or
1884                       if both are integer modes with M wider or the same
1885                       width as M1.  The check for integer is redundant, but
1886                       safe, since the only case of differing destination
1887                       modes with equal sources is when both sources are
1888                       VOIDmode, i.e., CONST_INT.  */
1889                    (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest)
1890                     || (GET_MODE_CLASS (GET_MODE (m->set_dest)) == MODE_INT
1891                         && GET_MODE_CLASS (GET_MODE (m1->set_dest)) == MODE_INT
1892                         && (GET_MODE_BITSIZE (GET_MODE (m->set_dest))
1893                             >= GET_MODE_BITSIZE (GET_MODE (m1->set_dest)))))
1894                    /* See if the source of M1 says it matches M.  */
1895                    && ((REG_P (m1->set_src)
1896                         && matched_regs[REGNO (m1->set_src)])
1897                        || rtx_equal_for_loop_p (m->set_src, m1->set_src,
1898                                                 movables, regs))))
1899               && ((m->dependencies == m1->dependencies)
1900                   || rtx_equal_p (m->dependencies, m1->dependencies)))
1901             {
1902               m->lifetime += m1->lifetime;
1903               m->savings += m1->savings;
1904               m1->done = 1;
1905               m1->match = m;
1906               matched_regs[m1->regno] = 1;
1907             }
1908       }
1909
1910   /* Now combine the regs used for zero-extension.
1911      This can be done for those not marked `global'
1912      provided their lives don't overlap.  */
1913
1914   for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); mode != VOIDmode;
1915        mode = GET_MODE_WIDER_MODE (mode))
1916     {
1917       struct movable *m0 = 0;
1918
1919       /* Combine all the registers for extension from mode MODE.
1920          Don't combine any that are used outside this loop.  */
1921       for (m = movables->head; m; m = m->next)
1922         if (m->partial && ! m->global
1923             && mode == GET_MODE (SET_SRC (PATTERN (NEXT_INSN (m->insn)))))
1924           {
1925             struct movable *m1;
1926
1927             int first = REGNO_FIRST_LUID (m->regno);
1928             int last = REGNO_LAST_LUID (m->regno);
1929
1930             if (m0 == 0)
1931               {
1932                 /* First one: don't check for overlap, just record it.  */
1933                 m0 = m;
1934                 continue;
1935               }
1936
1937             /* Make sure they extend to the same mode.
1938                (Almost always true.)  */
1939             if (GET_MODE (m->set_dest) != GET_MODE (m0->set_dest))
1940               continue;
1941
1942             /* We already have one: check for overlap with those
1943                already combined together.  */
1944             for (m1 = movables->head; m1 != m; m1 = m1->next)
1945               if (m1 == m0 || (m1->partial && m1->match == m0))
1946                 if (! (REGNO_FIRST_LUID (m1->regno) > last
1947                        || REGNO_LAST_LUID (m1->regno) < first))
1948                   goto overlap;
1949
1950             /* No overlap: we can combine this with the others.  */
1951             m0->lifetime += m->lifetime;
1952             m0->savings += m->savings;
1953             m->done = 1;
1954             m->match = m0;
1955
1956           overlap:
1957             ;
1958           }
1959     }
1960
1961   /* Clean up.  */
1962   free (matched_regs);
1963 }
1964
1965 /* Returns the number of movable instructions in LOOP that were not
1966    moved outside the loop.  */
1967
1968 static int
1969 num_unmoved_movables (const struct loop *loop)
1970 {
1971   int num = 0;
1972   struct movable *m;
1973
1974   for (m = LOOP_MOVABLES (loop)->head; m; m = m->next)
1975     if (!m->done)
1976       ++num;
1977
1978   return num;
1979 }
1980
1981 \f
1982 /* Return 1 if regs X and Y will become the same if moved.  */
1983
1984 static int
1985 regs_match_p (rtx x, rtx y, struct loop_movables *movables)
1986 {
1987   unsigned int xn = REGNO (x);
1988   unsigned int yn = REGNO (y);
1989   struct movable *mx, *my;
1990
1991   for (mx = movables->head; mx; mx = mx->next)
1992     if (mx->regno == xn)
1993       break;
1994
1995   for (my = movables->head; my; my = my->next)
1996     if (my->regno == yn)
1997       break;
1998
1999   return (mx && my
2000           && ((mx->match == my->match && mx->match != 0)
2001               || mx->match == my
2002               || mx == my->match));
2003 }
2004
2005 /* Return 1 if X and Y are identical-looking rtx's.
2006    This is the Lisp function EQUAL for rtx arguments.
2007
2008    If two registers are matching movables or a movable register and an
2009    equivalent constant, consider them equal.  */
2010
2011 static int
2012 rtx_equal_for_loop_p (rtx x, rtx y, struct loop_movables *movables,
2013                       struct loop_regs *regs)
2014 {
2015   int i;
2016   int j;
2017   struct movable *m;
2018   enum rtx_code code;
2019   const char *fmt;
2020
2021   if (x == y)
2022     return 1;
2023   if (x == 0 || y == 0)
2024     return 0;
2025
2026   code = GET_CODE (x);
2027
2028   /* If we have a register and a constant, they may sometimes be
2029      equal.  */
2030   if (REG_P (x) && regs->array[REGNO (x)].set_in_loop == -2
2031       && CONSTANT_P (y))
2032     {
2033       for (m = movables->head; m; m = m->next)
2034         if (m->move_insn && m->regno == REGNO (x)
2035             && rtx_equal_p (m->set_src, y))
2036           return 1;
2037     }
2038   else if (REG_P (y) && regs->array[REGNO (y)].set_in_loop == -2
2039            && CONSTANT_P (x))
2040     {
2041       for (m = movables->head; m; m = m->next)
2042         if (m->move_insn && m->regno == REGNO (y)
2043             && rtx_equal_p (m->set_src, x))
2044           return 1;
2045     }
2046
2047   /* Otherwise, rtx's of different codes cannot be equal.  */
2048   if (code != GET_CODE (y))
2049     return 0;
2050
2051   /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.
2052      (REG:SI x) and (REG:HI x) are NOT equivalent.  */
2053
2054   if (GET_MODE (x) != GET_MODE (y))
2055     return 0;
2056
2057   /* These three types of rtx's can be compared nonrecursively.  */
2058   if (code == REG)
2059     return (REGNO (x) == REGNO (y) || regs_match_p (x, y, movables));
2060
2061   if (code == LABEL_REF)
2062     return XEXP (x, 0) == XEXP (y, 0);
2063   if (code == SYMBOL_REF)
2064     return XSTR (x, 0) == XSTR (y, 0);
2065
2066   /* Compare the elements.  If any pair of corresponding elements
2067      fail to match, return 0 for the whole things.  */
2068
2069   fmt = GET_RTX_FORMAT (code);
2070   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2071     {
2072       switch (fmt[i])
2073         {
2074         case 'w':
2075           if (XWINT (x, i) != XWINT (y, i))
2076             return 0;
2077           break;
2078
2079         case 'i':
2080           if (XINT (x, i) != XINT (y, i))
2081             return 0;
2082           break;
2083
2084         case 'E':
2085           /* Two vectors must have the same length.  */
2086           if (XVECLEN (x, i) != XVECLEN (y, i))
2087             return 0;
2088
2089           /* And the corresponding elements must match.  */
2090           for (j = 0; j < XVECLEN (x, i); j++)
2091             if (rtx_equal_for_loop_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
2092                                       movables, regs) == 0)
2093               return 0;
2094           break;
2095
2096         case 'e':
2097           if (rtx_equal_for_loop_p (XEXP (x, i), XEXP (y, i), movables, regs)
2098               == 0)
2099             return 0;
2100           break;
2101
2102         case 's':
2103           if (strcmp (XSTR (x, i), XSTR (y, i)))
2104             return 0;
2105           break;
2106
2107         case 'u':
2108           /* These are just backpointers, so they don't matter.  */
2109           break;
2110
2111         case '0':
2112           break;
2113
2114           /* It is believed that rtx's at this level will never
2115              contain anything but integers and other rtx's,
2116              except for within LABEL_REFs and SYMBOL_REFs.  */
2117         default:
2118           gcc_unreachable ();
2119         }
2120     }
2121   return 1;
2122 }
2123 \f
2124 /* If X contains any LABEL_REF's, add REG_LABEL notes for them to all
2125    insns in INSNS which use the reference.  LABEL_NUSES for CODE_LABEL
2126    references is incremented once for each added note.  */
2127
2128 static void
2129 add_label_notes (rtx x, rtx insns)
2130 {
2131   enum rtx_code code = GET_CODE (x);
2132   int i, j;
2133   const char *fmt;
2134   rtx insn;
2135
2136   if (code == LABEL_REF && !LABEL_REF_NONLOCAL_P (x))
2137     {
2138       /* This code used to ignore labels that referred to dispatch tables to
2139          avoid flow generating (slightly) worse code.
2140
2141          We no longer ignore such label references (see LABEL_REF handling in
2142          mark_jump_label for additional information).  */
2143       for (insn = insns; insn; insn = NEXT_INSN (insn))
2144         if (reg_mentioned_p (XEXP (x, 0), insn))
2145           {
2146             REG_NOTES (insn) = gen_rtx_INSN_LIST (REG_LABEL, XEXP (x, 0),
2147                                                   REG_NOTES (insn));
2148             if (LABEL_P (XEXP (x, 0)))
2149               LABEL_NUSES (XEXP (x, 0))++;
2150           }
2151     }
2152
2153   fmt = GET_RTX_FORMAT (code);
2154   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2155     {
2156       if (fmt[i] == 'e')
2157         add_label_notes (XEXP (x, i), insns);
2158       else if (fmt[i] == 'E')
2159         for (j = XVECLEN (x, i) - 1; j >= 0; j--)
2160           add_label_notes (XVECEXP (x, i, j), insns);
2161     }
2162 }
2163 \f
2164 /* Scan MOVABLES, and move the insns that deserve to be moved.
2165    If two matching movables are combined, replace one reg with the
2166    other throughout.  */
2167
2168 static void
2169 move_movables (struct loop *loop, struct loop_movables *movables,
2170                int threshold, int insn_count)
2171 {
2172   struct loop_regs *regs = LOOP_REGS (loop);
2173   int nregs = regs->num;
2174   rtx new_start = 0;
2175   struct movable *m;
2176   rtx p;
2177   rtx loop_start = loop->start;
2178   rtx loop_end = loop->end;
2179   /* Map of pseudo-register replacements to handle combining
2180      when we move several insns that load the same value
2181      into different pseudo-registers.  */
2182   rtx *reg_map = xcalloc (nregs, sizeof (rtx));
2183   char *already_moved = xcalloc (nregs, sizeof (char));
2184
2185   for (m = movables->head; m; m = m->next)
2186     {
2187       /* Describe this movable insn.  */
2188
2189       if (loop_dump_stream)
2190         {
2191           fprintf (loop_dump_stream, "Insn %d: regno %d (life %d), ",
2192                    INSN_UID (m->insn), m->regno, m->lifetime);
2193           if (m->consec > 0)
2194             fprintf (loop_dump_stream, "consec %d, ", m->consec);
2195           if (m->cond)
2196             fprintf (loop_dump_stream, "cond ");
2197           if (m->force)
2198             fprintf (loop_dump_stream, "force ");
2199           if (m->global)
2200             fprintf (loop_dump_stream, "global ");
2201           if (m->done)
2202             fprintf (loop_dump_stream, "done ");
2203           if (m->move_insn)
2204             fprintf (loop_dump_stream, "move-insn ");
2205           if (m->match)
2206             fprintf (loop_dump_stream, "matches %d ",
2207                      INSN_UID (m->match->insn));
2208           if (m->forces)
2209             fprintf (loop_dump_stream, "forces %d ",
2210                      INSN_UID (m->forces->insn));
2211         }
2212
2213       /* Ignore the insn if it's already done (it matched something else).
2214          Otherwise, see if it is now safe to move.  */
2215
2216       if (!m->done
2217           && (! m->cond
2218               || (1 == loop_invariant_p (loop, m->set_src)
2219                   && (m->dependencies == 0
2220                       || 1 == loop_invariant_p (loop, m->dependencies))
2221                   && (m->consec == 0
2222                       || 1 == consec_sets_invariant_p (loop, m->set_dest,
2223                                                        m->consec + 1,
2224                                                        m->insn))))
2225           && (! m->forces || m->forces->done))
2226         {
2227           int regno;
2228           rtx p;
2229           int savings = m->savings;
2230
2231           /* We have an insn that is safe to move.
2232              Compute its desirability.  */
2233
2234           p = m->insn;
2235           regno = m->regno;
2236
2237           if (loop_dump_stream)
2238             fprintf (loop_dump_stream, "savings %d ", savings);
2239
2240           if (regs->array[regno].moved_once && loop_dump_stream)
2241             fprintf (loop_dump_stream, "halved since already moved ");
2242
2243           /* An insn MUST be moved if we already moved something else
2244              which is safe only if this one is moved too: that is,
2245              if already_moved[REGNO] is nonzero.  */
2246
2247           /* An insn is desirable to move if the new lifetime of the
2248              register is no more than THRESHOLD times the old lifetime.
2249              If it's not desirable, it means the loop is so big
2250              that moving won't speed things up much,
2251              and it is liable to make register usage worse.  */
2252
2253           /* It is also desirable to move if it can be moved at no
2254              extra cost because something else was already moved.  */
2255
2256           if (already_moved[regno]
2257               || (threshold * savings * m->lifetime) >=
2258                  (regs->array[regno].moved_once ? insn_count * 2 : insn_count)
2259               || (m->forces && m->forces->done
2260                   && regs->array[m->forces->regno].n_times_set == 1))
2261             {
2262               int count;
2263               struct movable *m1;
2264               rtx first = NULL_RTX;
2265               rtx newreg = NULL_RTX;
2266
2267               if (m->insert_temp)
2268                 newreg = gen_reg_rtx (GET_MODE (m->set_dest));
2269
2270               /* Now move the insns that set the reg.  */
2271
2272               if (m->partial && m->match)
2273                 {
2274                   rtx newpat, i1;
2275                   rtx r1, r2;
2276                   /* Find the end of this chain of matching regs.
2277                      Thus, we load each reg in the chain from that one reg.
2278                      And that reg is loaded with 0 directly,
2279                      since it has ->match == 0.  */
2280                   for (m1 = m; m1->match; m1 = m1->match);
2281                   newpat = gen_move_insn (SET_DEST (PATTERN (m->insn)),
2282                                           SET_DEST (PATTERN (m1->insn)));
2283                   i1 = loop_insn_hoist (loop, newpat);
2284
2285                   /* Mark the moved, invariant reg as being allowed to
2286                      share a hard reg with the other matching invariant.  */
2287                   REG_NOTES (i1) = REG_NOTES (m->insn);
2288                   r1 = SET_DEST (PATTERN (m->insn));
2289                   r2 = SET_DEST (PATTERN (m1->insn));
2290                   regs_may_share
2291                     = gen_rtx_EXPR_LIST (VOIDmode, r1,
2292                                          gen_rtx_EXPR_LIST (VOIDmode, r2,
2293                                                             regs_may_share));
2294                   delete_insn (m->insn);
2295
2296                   if (new_start == 0)
2297                     new_start = i1;
2298
2299                   if (loop_dump_stream)
2300                     fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
2301                 }
2302               /* If we are to re-generate the item being moved with a
2303                  new move insn, first delete what we have and then emit
2304                  the move insn before the loop.  */
2305               else if (m->move_insn)
2306                 {
2307                   rtx i1, temp, seq;
2308
2309                   for (count = m->consec; count >= 0; count--)
2310                     {
2311                       if (!NOTE_P (p))
2312                         {
2313                           /* If this is the first insn of a library
2314                              call sequence, something is very
2315                              wrong.  */
2316                           gcc_assert (!find_reg_note
2317                                       (p, REG_LIBCALL, NULL_RTX));
2318
2319                           /* If this is the last insn of a libcall
2320                              sequence, then delete every insn in the
2321                              sequence except the last.  The last insn
2322                              is handled in the normal manner.  */
2323                           temp = find_reg_note (p, REG_RETVAL, NULL_RTX);
2324
2325                           if (temp)
2326                             {
2327                               temp = XEXP (temp, 0);
2328                               while (temp != p)
2329                                 temp = delete_insn (temp);
2330                             }
2331                         }
2332
2333                       temp = p;
2334                       p = delete_insn (p);
2335
2336                       /* simplify_giv_expr expects that it can walk the insns
2337                          at m->insn forwards and see this old sequence we are
2338                          tossing here.  delete_insn does preserve the next
2339                          pointers, but when we skip over a NOTE we must fix
2340                          it up.  Otherwise that code walks into the non-deleted
2341                          insn stream.  */
2342                       while (p && NOTE_P (p))
2343                         p = NEXT_INSN (temp) = NEXT_INSN (p);
2344
2345                       if (m->insert_temp)
2346                         {
2347                           /* Replace the original insn with a move from
2348                              our newly created temp.  */
2349                           start_sequence ();
2350                           emit_move_insn (m->set_dest, newreg);
2351                           seq = get_insns ();
2352                           end_sequence ();
2353                           emit_insn_before (seq, p);
2354                         }
2355                     }
2356
2357                   start_sequence ();
2358                   emit_move_insn (m->insert_temp ? newreg : m->set_dest,
2359                                   m->set_src);
2360                   seq = get_insns ();
2361                   end_sequence ();
2362
2363                   add_label_notes (m->set_src, seq);
2364
2365                   i1 = loop_insn_hoist (loop, seq);
2366                   if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2367                     set_unique_reg_note (i1,
2368                                          m->is_equiv ? REG_EQUIV : REG_EQUAL,
2369                                          m->set_src);
2370
2371                   if (loop_dump_stream)
2372                     fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
2373
2374                   /* The more regs we move, the less we like moving them.  */
2375                   threshold -= 3;
2376                 }
2377               else
2378                 {
2379                   for (count = m->consec; count >= 0; count--)
2380                     {
2381                       rtx i1, temp;
2382
2383                       /* If first insn of libcall sequence, skip to end.  */
2384                       /* Do this at start of loop, since p is guaranteed to
2385                          be an insn here.  */
2386                       if (!NOTE_P (p)
2387                           && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
2388                         p = XEXP (temp, 0);
2389
2390                       /* If last insn of libcall sequence, move all
2391                          insns except the last before the loop.  The last
2392                          insn is handled in the normal manner.  */
2393                       if (!NOTE_P (p)
2394                           && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
2395                         {
2396                           rtx fn_address = 0;
2397                           rtx fn_reg = 0;
2398                           rtx fn_address_insn = 0;
2399
2400                           first = 0;
2401                           for (temp = XEXP (temp, 0); temp != p;
2402                                temp = NEXT_INSN (temp))
2403                             {
2404                               rtx body;
2405                               rtx n;
2406                               rtx next;
2407
2408                               if (NOTE_P (temp))
2409                                 continue;
2410
2411                               body = PATTERN (temp);
2412
2413                               /* Find the next insn after TEMP,
2414                                  not counting USE or NOTE insns.  */
2415                               for (next = NEXT_INSN (temp); next != p;
2416                                    next = NEXT_INSN (next))
2417                                 if (! (NONJUMP_INSN_P (next)
2418                                        && GET_CODE (PATTERN (next)) == USE)
2419                                     && !NOTE_P (next))
2420                                   break;
2421
2422                               /* If that is the call, this may be the insn
2423                                  that loads the function address.
2424
2425                                  Extract the function address from the insn
2426                                  that loads it into a register.
2427                                  If this insn was cse'd, we get incorrect code.
2428
2429                                  So emit a new move insn that copies the
2430                                  function address into the register that the
2431                                  call insn will use.  flow.c will delete any
2432                                  redundant stores that we have created.  */
2433                               if (CALL_P (next)
2434                                   && GET_CODE (body) == SET
2435                                   && REG_P (SET_DEST (body))
2436                                   && (n = find_reg_note (temp, REG_EQUAL,
2437                                                          NULL_RTX)))
2438                                 {
2439                                   fn_reg = SET_SRC (body);
2440                                   if (!REG_P (fn_reg))
2441                                     fn_reg = SET_DEST (body);
2442                                   fn_address = XEXP (n, 0);
2443                                   fn_address_insn = temp;
2444                                 }
2445                               /* We have the call insn.
2446                                  If it uses the register we suspect it might,
2447                                  load it with the correct address directly.  */
2448                               if (CALL_P (temp)
2449                                   && fn_address != 0
2450                                   && reg_referenced_p (fn_reg, body))
2451                                 loop_insn_emit_after (loop, 0, fn_address_insn,
2452                                                       gen_move_insn
2453                                                       (fn_reg, fn_address));
2454
2455                               if (CALL_P (temp))
2456                                 {
2457                                   i1 = loop_call_insn_hoist (loop, body);
2458                                   /* Because the USAGE information potentially
2459                                      contains objects other than hard registers
2460                                      we need to copy it.  */
2461                                   if (CALL_INSN_FUNCTION_USAGE (temp))
2462                                     CALL_INSN_FUNCTION_USAGE (i1)
2463                                       = copy_rtx (CALL_INSN_FUNCTION_USAGE (temp));
2464                                 }
2465                               else
2466                                 i1 = loop_insn_hoist (loop, body);
2467                               if (first == 0)
2468                                 first = i1;
2469                               if (temp == fn_address_insn)
2470                                 fn_address_insn = i1;
2471                               REG_NOTES (i1) = REG_NOTES (temp);
2472                               REG_NOTES (temp) = NULL;
2473                               delete_insn (temp);
2474                             }
2475                           if (new_start == 0)
2476                             new_start = first;
2477                         }
2478                       if (m->savemode != VOIDmode)
2479                         {
2480                           /* P sets REG to zero; but we should clear only
2481                              the bits that are not covered by the mode
2482                              m->savemode.  */
2483                           rtx reg = m->set_dest;
2484                           rtx sequence;
2485                           rtx tem;
2486
2487                           start_sequence ();
2488                           tem = expand_simple_binop
2489                             (GET_MODE (reg), AND, reg,
2490                              GEN_INT ((((HOST_WIDE_INT) 1
2491                                         << GET_MODE_BITSIZE (m->savemode)))
2492                                       - 1),
2493                              reg, 1, OPTAB_LIB_WIDEN);
2494                           gcc_assert (tem);
2495                           if (tem != reg)
2496                             emit_move_insn (reg, tem);
2497                           sequence = get_insns ();
2498                           end_sequence ();
2499                           i1 = loop_insn_hoist (loop, sequence);
2500                         }
2501                       else if (CALL_P (p))
2502                         {
2503                           i1 = loop_call_insn_hoist (loop, PATTERN (p));
2504                           /* Because the USAGE information potentially
2505                              contains objects other than hard registers
2506                              we need to copy it.  */
2507                           if (CALL_INSN_FUNCTION_USAGE (p))
2508                             CALL_INSN_FUNCTION_USAGE (i1)
2509                               = copy_rtx (CALL_INSN_FUNCTION_USAGE (p));
2510                         }
2511                       else if (count == m->consec && m->move_insn_first)
2512                         {
2513                           rtx seq;
2514                           /* The SET_SRC might not be invariant, so we must
2515                              use the REG_EQUAL note.  */
2516                           start_sequence ();
2517                           emit_move_insn (m->insert_temp ? newreg : m->set_dest,
2518                                           m->set_src);
2519                           seq = get_insns ();
2520                           end_sequence ();
2521
2522                           add_label_notes (m->set_src, seq);
2523
2524                           i1 = loop_insn_hoist (loop, seq);
2525                           if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2526                             set_unique_reg_note (i1, m->is_equiv ? REG_EQUIV
2527                                                      : REG_EQUAL, m->set_src);
2528                         }
2529                       else if (m->insert_temp)
2530                         {
2531                           rtx *reg_map2 = xcalloc (REGNO (newreg),
2532                                                    sizeof(rtx));
2533                           reg_map2 [m->regno] = newreg;
2534
2535                           i1 = loop_insn_hoist (loop, copy_rtx (PATTERN (p)));
2536                           replace_regs (i1, reg_map2, REGNO (newreg), 1);
2537                           free (reg_map2);
2538                         }
2539                       else
2540                         i1 = loop_insn_hoist (loop, PATTERN (p));
2541
2542                       if (REG_NOTES (i1) == 0)
2543                         {
2544                           REG_NOTES (i1) = REG_NOTES (p);
2545                           REG_NOTES (p) = NULL;
2546
2547                           /* If there is a REG_EQUAL note present whose value
2548                              is not loop invariant, then delete it, since it
2549                              may cause problems with later optimization passes.
2550                              It is possible for cse to create such notes
2551                              like this as a result of record_jump_cond.  */
2552
2553                           if ((temp = find_reg_note (i1, REG_EQUAL, NULL_RTX))
2554                               && ! loop_invariant_p (loop, XEXP (temp, 0)))
2555                             remove_note (i1, temp);
2556                         }
2557
2558                       if (new_start == 0)
2559                         new_start = i1;
2560
2561                       if (loop_dump_stream)
2562                         fprintf (loop_dump_stream, " moved to %d",
2563                                  INSN_UID (i1));
2564
2565                       /* If library call, now fix the REG_NOTES that contain
2566                          insn pointers, namely REG_LIBCALL on FIRST
2567                          and REG_RETVAL on I1.  */
2568                       if ((temp = find_reg_note (i1, REG_RETVAL, NULL_RTX)))
2569                         {
2570                           XEXP (temp, 0) = first;
2571                           temp = find_reg_note (first, REG_LIBCALL, NULL_RTX);
2572                           XEXP (temp, 0) = i1;
2573                         }
2574
2575                       temp = p;
2576                       delete_insn (p);
2577                       p = NEXT_INSN (p);
2578
2579                       /* simplify_giv_expr expects that it can walk the insns
2580                          at m->insn forwards and see this old sequence we are
2581                          tossing here.  delete_insn does preserve the next
2582                          pointers, but when we skip over a NOTE we must fix
2583                          it up.  Otherwise that code walks into the non-deleted
2584                          insn stream.  */
2585                       while (p && NOTE_P (p))
2586                         p = NEXT_INSN (temp) = NEXT_INSN (p);
2587
2588                       if (m->insert_temp)
2589                         {
2590                           rtx seq;
2591                           /* Replace the original insn with a move from
2592                              our newly created temp.  */
2593                           start_sequence ();
2594                           emit_move_insn (m->set_dest, newreg);
2595                           seq = get_insns ();
2596                           end_sequence ();
2597                           emit_insn_before (seq, p);
2598                         }
2599                     }
2600
2601                   /* The more regs we move, the less we like moving them.  */
2602                   threshold -= 3;
2603                 }
2604
2605               m->done = 1;
2606
2607               if (!m->insert_temp)
2608                 {
2609                   /* Any other movable that loads the same register
2610                      MUST be moved.  */
2611                   already_moved[regno] = 1;
2612
2613                   /* This reg has been moved out of one loop.  */
2614                   regs->array[regno].moved_once = 1;
2615
2616                   /* The reg set here is now invariant.  */
2617                   if (! m->partial)
2618                     {
2619                       int i;
2620                       for (i = 0; i < LOOP_REGNO_NREGS (regno, m->set_dest); i++)
2621                         regs->array[regno+i].set_in_loop = 0;
2622                     }
2623
2624                   /* Change the length-of-life info for the register
2625                      to say it lives at least the full length of this loop.
2626                      This will help guide optimizations in outer loops.  */
2627
2628                   if (REGNO_FIRST_LUID (regno) > INSN_LUID (loop_start))
2629                     /* This is the old insn before all the moved insns.
2630                        We can't use the moved insn because it is out of range
2631                        in uid_luid.  Only the old insns have luids.  */
2632                     REGNO_FIRST_UID (regno) = INSN_UID (loop_start);
2633                   if (REGNO_LAST_LUID (regno) < INSN_LUID (loop_end))
2634                     REGNO_LAST_UID (regno) = INSN_UID (loop_end);
2635                 }
2636
2637               /* Combine with this moved insn any other matching movables.  */
2638
2639               if (! m->partial)
2640                 for (m1 = movables->head; m1; m1 = m1->next)
2641                   if (m1->match == m)
2642                     {
2643                       rtx temp;
2644
2645                       /* Schedule the reg loaded by M1
2646                          for replacement so that shares the reg of M.
2647                          If the modes differ (only possible in restricted
2648                          circumstances, make a SUBREG.
2649
2650                          Note this assumes that the target dependent files
2651                          treat REG and SUBREG equally, including within
2652                          GO_IF_LEGITIMATE_ADDRESS and in all the
2653                          predicates since we never verify that replacing the
2654                          original register with a SUBREG results in a
2655                          recognizable insn.  */
2656                       if (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest))
2657                         reg_map[m1->regno] = m->set_dest;
2658                       else
2659                         reg_map[m1->regno]
2660                           = gen_lowpart_common (GET_MODE (m1->set_dest),
2661                                                 m->set_dest);
2662
2663                       /* Get rid of the matching insn
2664                          and prevent further processing of it.  */
2665                       m1->done = 1;
2666
2667                       /* If library call, delete all insns.  */
2668                       if ((temp = find_reg_note (m1->insn, REG_RETVAL,
2669                                                  NULL_RTX)))
2670                         delete_insn_chain (XEXP (temp, 0), m1->insn);
2671                       else
2672                         delete_insn (m1->insn);
2673
2674                       /* Any other movable that loads the same register
2675                          MUST be moved.  */
2676                       already_moved[m1->regno] = 1;
2677
2678                       /* The reg merged here is now invariant,
2679                          if the reg it matches is invariant.  */
2680                       if (! m->partial)
2681                         {
2682                           int i;
2683                           for (i = 0;
2684                                i < LOOP_REGNO_NREGS (regno, m1->set_dest);
2685                                i++)
2686                             regs->array[m1->regno+i].set_in_loop = 0;
2687                         }
2688                     }
2689             }
2690           else if (loop_dump_stream)
2691             fprintf (loop_dump_stream, "not desirable");
2692         }
2693       else if (loop_dump_stream && !m->match)
2694         fprintf (loop_dump_stream, "not safe");
2695
2696       if (loop_dump_stream)
2697         fprintf (loop_dump_stream, "\n");
2698     }
2699
2700   if (new_start == 0)
2701     new_start = loop_start;
2702
2703   /* Go through all the instructions in the loop, making
2704      all the register substitutions scheduled in REG_MAP.  */
2705   for (p = new_start; p != loop_end; p = NEXT_INSN (p))
2706     if (INSN_P (p))
2707       {
2708         replace_regs (PATTERN (p), reg_map, nregs, 0);
2709         replace_regs (REG_NOTES (p), reg_map, nregs, 0);
2710         INSN_CODE (p) = -1;
2711       }
2712
2713   /* Clean up.  */
2714   free (reg_map);
2715   free (already_moved);
2716 }
2717
2718
2719 static void
2720 loop_movables_add (struct loop_movables *movables, struct movable *m)
2721 {
2722   if (movables->head == 0)
2723     movables->head = m;
2724   else
2725     movables->last->next = m;
2726   movables->last = m;
2727 }
2728
2729
2730 static void
2731 loop_movables_free (struct loop_movables *movables)
2732 {
2733   struct movable *m;
2734   struct movable *m_next;
2735
2736   for (m = movables->head; m; m = m_next)
2737     {
2738       m_next = m->next;
2739       free (m);
2740     }
2741 }
2742 \f
2743 #if 0
2744 /* Scan X and replace the address of any MEM in it with ADDR.
2745    REG is the address that MEM should have before the replacement.  */
2746
2747 static void
2748 replace_call_address (rtx x, rtx reg, rtx addr)
2749 {
2750   enum rtx_code code;
2751   int i;
2752   const char *fmt;
2753
2754   if (x == 0)
2755     return;
2756   code = GET_CODE (x);
2757   switch (code)
2758     {
2759     case PC:
2760     case CC0:
2761     case CONST_INT:
2762     case CONST_DOUBLE:
2763     case CONST:
2764     case SYMBOL_REF:
2765     case LABEL_REF:
2766     case REG:
2767       return;
2768
2769     case SET:
2770       /* Short cut for very common case.  */
2771       replace_call_address (XEXP (x, 1), reg, addr);
2772       return;
2773
2774     case CALL:
2775       /* Short cut for very common case.  */
2776       replace_call_address (XEXP (x, 0), reg, addr);
2777       return;
2778
2779     case MEM:
2780       /* If this MEM uses a reg other than the one we expected,
2781          something is wrong.  */
2782       gcc_assert (XEXP (x, 0) == reg);
2783       XEXP (x, 0) = addr;
2784       return;
2785
2786     default:
2787       break;
2788     }
2789
2790   fmt = GET_RTX_FORMAT (code);
2791   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2792     {
2793       if (fmt[i] == 'e')
2794         replace_call_address (XEXP (x, i), reg, addr);
2795       else if (fmt[i] == 'E')
2796         {
2797           int j;
2798           for (j = 0; j < XVECLEN (x, i); j++)
2799             replace_call_address (XVECEXP (x, i, j), reg, addr);
2800         }
2801     }
2802 }
2803 #endif
2804 \f
2805 /* Return the number of memory refs to addresses that vary
2806    in the rtx X.  */
2807
2808 static int
2809 count_nonfixed_reads (const struct loop *loop, rtx x)
2810 {
2811   enum rtx_code code;
2812   int i;
2813   const char *fmt;
2814   int value;
2815
2816   if (x == 0)
2817     return 0;
2818
2819   code = GET_CODE (x);
2820   switch (code)
2821     {
2822     case PC:
2823     case CC0:
2824     case CONST_INT:
2825     case CONST_DOUBLE:
2826     case CONST:
2827     case SYMBOL_REF:
2828     case LABEL_REF:
2829     case REG:
2830       return 0;
2831
2832     case MEM:
2833       return ((loop_invariant_p (loop, XEXP (x, 0)) != 1)
2834               + count_nonfixed_reads (loop, XEXP (x, 0)));
2835
2836     default:
2837       break;
2838     }
2839
2840   value = 0;
2841   fmt = GET_RTX_FORMAT (code);
2842   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2843     {
2844       if (fmt[i] == 'e')
2845         value += count_nonfixed_reads (loop, XEXP (x, i));
2846       if (fmt[i] == 'E')
2847         {
2848           int j;
2849           for (j = 0; j < XVECLEN (x, i); j++)
2850             value += count_nonfixed_reads (loop, XVECEXP (x, i, j));
2851         }
2852     }
2853   return value;
2854 }
2855 \f
2856 /* Scan a loop setting the elements `loops_enclosed',
2857    `has_call', `has_nonconst_call', `has_volatile', `has_tablejump',
2858    `unknown_address_altered', `unknown_constant_address_altered', and
2859    `num_mem_sets' in LOOP.  Also, fill in the array `mems' and the
2860    list `store_mems' in LOOP.  */
2861
2862 static void
2863 prescan_loop (struct loop *loop)
2864 {
2865   int level = 1;
2866   rtx insn;
2867   struct loop_info *loop_info = LOOP_INFO (loop);
2868   rtx start = loop->start;
2869   rtx end = loop->end;
2870   /* The label after END.  Jumping here is just like falling off the
2871      end of the loop.  We use next_nonnote_insn instead of next_label
2872      as a hedge against the (pathological) case where some actual insn
2873      might end up between the two.  */
2874   rtx exit_target = next_nonnote_insn (end);
2875
2876   loop_info->has_indirect_jump = indirect_jump_in_function;
2877   loop_info->pre_header_has_call = 0;
2878   loop_info->has_call = 0;
2879   loop_info->has_nonconst_call = 0;
2880   loop_info->has_prefetch = 0;
2881   loop_info->has_volatile = 0;
2882   loop_info->has_tablejump = 0;
2883   loop_info->has_multiple_exit_targets = 0;
2884   loop->level = 1;
2885
2886   loop_info->unknown_address_altered = 0;
2887   loop_info->unknown_constant_address_altered = 0;
2888   loop_info->store_mems = NULL_RTX;
2889   loop_info->first_loop_store_insn = NULL_RTX;
2890   loop_info->mems_idx = 0;
2891   loop_info->num_mem_sets = 0;
2892
2893   for (insn = start; insn && !LABEL_P (insn);
2894        insn = PREV_INSN (insn))
2895     {
2896       if (CALL_P (insn))
2897         {
2898           loop_info->pre_header_has_call = 1;
2899           break;
2900         }
2901     }
2902
2903   for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2904        insn = NEXT_INSN (insn))
2905     {
2906       switch (GET_CODE (insn))
2907         {
2908         case NOTE:
2909           if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
2910             {
2911               ++level;
2912               /* Count number of loops contained in this one.  */
2913               loop->level++;
2914             }
2915           else if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END)
2916             --level;
2917           break;
2918
2919         case CALL_INSN:
2920           if (! CONST_OR_PURE_CALL_P (insn))
2921             {
2922               loop_info->unknown_address_altered = 1;
2923               loop_info->has_nonconst_call = 1;
2924             }
2925           else if (pure_call_p (insn))
2926             loop_info->has_nonconst_call = 1;
2927           loop_info->has_call = 1;
2928           if (can_throw_internal (insn))
2929             loop_info->has_multiple_exit_targets = 1;
2930           break;
2931
2932         case JUMP_INSN:
2933           if (! loop_info->has_multiple_exit_targets)
2934             {
2935               rtx set = pc_set (insn);
2936
2937               if (set)
2938                 {
2939                   rtx src = SET_SRC (set);
2940                   rtx label1, label2;
2941
2942                   if (GET_CODE (src) == IF_THEN_ELSE)
2943                     {
2944                       label1 = XEXP (src, 1);
2945                       label2 = XEXP (src, 2);
2946                     }
2947                   else
2948                     {
2949                       label1 = src;
2950                       label2 = NULL_RTX;
2951                     }
2952
2953                   do
2954                     {
2955                       if (label1 && label1 != pc_rtx)
2956                         {
2957                           if (GET_CODE (label1) != LABEL_REF)
2958                             {
2959                               /* Something tricky.  */
2960                               loop_info->has_multiple_exit_targets = 1;
2961                               break;
2962                             }
2963                           else if (XEXP (label1, 0) != exit_target
2964                                    && LABEL_OUTSIDE_LOOP_P (label1))
2965                             {
2966                               /* A jump outside the current loop.  */
2967                               loop_info->has_multiple_exit_targets = 1;
2968                               break;
2969                             }
2970                         }
2971
2972                       label1 = label2;
2973                       label2 = NULL_RTX;
2974                     }
2975                   while (label1);
2976                 }
2977               else
2978                 {
2979                   /* A return, or something tricky.  */
2980                   loop_info->has_multiple_exit_targets = 1;
2981                 }
2982             }
2983           /* Fall through.  */
2984
2985         case INSN:
2986           if (volatile_refs_p (PATTERN (insn)))
2987             loop_info->has_volatile = 1;
2988
2989           if (JUMP_P (insn)
2990               && (GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
2991                   || GET_CODE (PATTERN (insn)) == ADDR_VEC))
2992             loop_info->has_tablejump = 1;
2993
2994           note_stores (PATTERN (insn), note_addr_stored, loop_info);
2995           if (! loop_info->first_loop_store_insn && loop_info->store_mems)
2996             loop_info->first_loop_store_insn = insn;
2997
2998           if (flag_non_call_exceptions && can_throw_internal (insn))
2999             loop_info->has_multiple_exit_targets = 1;
3000           break;
3001
3002         default:
3003           break;
3004         }
3005     }
3006
3007   /* Now, rescan the loop, setting up the LOOP_MEMS array.  */
3008   if (/* An exception thrown by a called function might land us
3009          anywhere.  */
3010       ! loop_info->has_nonconst_call
3011       /* We don't want loads for MEMs moved to a location before the
3012          one at which their stack memory becomes allocated.  (Note
3013          that this is not a problem for malloc, etc., since those
3014          require actual function calls.  */
3015       && ! current_function_calls_alloca
3016       /* There are ways to leave the loop other than falling off the
3017          end.  */
3018       && ! loop_info->has_multiple_exit_targets)
3019     for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
3020          insn = NEXT_INSN (insn))
3021       for_each_rtx (&insn, insert_loop_mem, loop_info);
3022
3023   /* BLKmode MEMs are added to LOOP_STORE_MEM as necessary so
3024      that loop_invariant_p and load_mems can use true_dependence
3025      to determine what is really clobbered.  */
3026   if (loop_info->unknown_address_altered)
3027     {
3028       rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
3029
3030       loop_info->store_mems
3031         = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
3032     }
3033   if (loop_info->unknown_constant_address_altered)
3034     {
3035       rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
3036       MEM_READONLY_P (mem) = 1;
3037       loop_info->store_mems
3038         = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
3039     }
3040 }
3041 \f
3042 /* Invalidate all loops containing LABEL.  */
3043
3044 static void
3045 invalidate_loops_containing_label (rtx label)
3046 {
3047   struct loop *loop;
3048   for (loop = uid_loop[INSN_UID (label)]; loop; loop = loop->outer)
3049     loop->invalid = 1;
3050 }
3051
3052 /* Scan the function looking for loops.  Record the start and end of each loop.
3053    Also mark as invalid loops any loops that contain a setjmp or are branched
3054    to from outside the loop.  */
3055
3056 static void
3057 find_and_verify_loops (rtx f, struct loops *loops)
3058 {
3059   rtx insn;
3060   rtx label;
3061   int num_loops;
3062   struct loop *current_loop;
3063   struct loop *next_loop;
3064   struct loop *loop;
3065
3066   num_loops = loops->num;
3067
3068   compute_luids (f, NULL_RTX, 0);
3069
3070   /* If there are jumps to undefined labels,
3071      treat them as jumps out of any/all loops.
3072      This also avoids writing past end of tables when there are no loops.  */
3073   uid_loop[0] = NULL;
3074
3075   /* Find boundaries of loops, mark which loops are contained within
3076      loops, and invalidate loops that have setjmp.  */
3077
3078   num_loops = 0;
3079   current_loop = NULL;
3080   for (insn = f; insn; insn = NEXT_INSN (insn))
3081     {
3082       if (NOTE_P (insn))
3083         switch (NOTE_LINE_NUMBER (insn))
3084           {
3085           case NOTE_INSN_LOOP_BEG:
3086             next_loop = loops->array + num_loops;
3087             next_loop->num = num_loops;
3088             num_loops++;
3089             next_loop->start = insn;
3090             next_loop->outer = current_loop;
3091             current_loop = next_loop;
3092             break;
3093
3094           case NOTE_INSN_LOOP_END:
3095             gcc_assert (current_loop);
3096
3097             current_loop->end = insn;
3098             current_loop = current_loop->outer;
3099             break;
3100
3101           default:
3102             break;
3103           }
3104
3105       if (CALL_P (insn)
3106           && find_reg_note (insn, REG_SETJMP, NULL))
3107         {
3108           /* In this case, we must invalidate our current loop and any
3109              enclosing loop.  */
3110           for (loop = current_loop; loop; loop = loop->outer)
3111             {
3112               loop->invalid = 1;
3113               if (loop_dump_stream)
3114                 fprintf (loop_dump_stream,
3115                          "\nLoop at %d ignored due to setjmp.\n",
3116                          INSN_UID (loop->start));
3117             }
3118         }
3119
3120       /* Note that this will mark the NOTE_INSN_LOOP_END note as being in the
3121          enclosing loop, but this doesn't matter.  */
3122       uid_loop[INSN_UID (insn)] = current_loop;
3123     }
3124
3125   /* Any loop containing a label used in an initializer must be invalidated,
3126      because it can be jumped into from anywhere.  */
3127   for (label = forced_labels; label; label = XEXP (label, 1))
3128     invalidate_loops_containing_label (XEXP (label, 0));
3129
3130   /* Any loop containing a label used for an exception handler must be
3131      invalidated, because it can be jumped into from anywhere.  */
3132   for_each_eh_label (invalidate_loops_containing_label);
3133
3134   /* Now scan all insn's in the function.  If any JUMP_INSN branches into a
3135      loop that it is not contained within, that loop is marked invalid.
3136      If any INSN or CALL_INSN uses a label's address, then the loop containing
3137      that label is marked invalid, because it could be jumped into from
3138      anywhere.
3139
3140      Also look for blocks of code ending in an unconditional branch that
3141      exits the loop.  If such a block is surrounded by a conditional
3142      branch around the block, move the block elsewhere (see below) and
3143      invert the jump to point to the code block.  This may eliminate a
3144      label in our loop and will simplify processing by both us and a
3145      possible second cse pass.  */
3146
3147   for (insn = f; insn; insn = NEXT_INSN (insn))
3148     if (INSN_P (insn))
3149       {
3150         struct loop *this_loop = uid_loop[INSN_UID (insn)];
3151
3152         if (NONJUMP_INSN_P (insn) || CALL_P (insn))
3153           {
3154             rtx note = find_reg_note (insn, REG_LABEL, NULL_RTX);
3155             if (note)
3156               invalidate_loops_containing_label (XEXP (note, 0));
3157           }
3158
3159         if (!JUMP_P (insn))
3160           continue;
3161
3162         mark_loop_jump (PATTERN (insn), this_loop);
3163
3164         /* See if this is an unconditional branch outside the loop.  */
3165         if (this_loop
3166             && (GET_CODE (PATTERN (insn)) == RETURN
3167                 || (any_uncondjump_p (insn)
3168                     && onlyjump_p (insn)
3169                     && (uid_loop[INSN_UID (JUMP_LABEL (insn))]
3170                         != this_loop)))
3171             && get_max_uid () < max_uid_for_loop)
3172           {
3173             rtx p;
3174             rtx our_next = next_real_insn (insn);
3175             rtx last_insn_to_move = NEXT_INSN (insn);
3176             struct loop *dest_loop;
3177             struct loop *outer_loop = NULL;
3178
3179             /* Go backwards until we reach the start of the loop, a label,
3180                or a JUMP_INSN.  */
3181             for (p = PREV_INSN (insn);
3182                  !LABEL_P (p)
3183                  && ! (NOTE_P (p)
3184                        && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
3185                  && !JUMP_P (p);
3186                  p = PREV_INSN (p))
3187               ;
3188
3189             /* Check for the case where we have a jump to an inner nested
3190                loop, and do not perform the optimization in that case.  */
3191
3192             if (JUMP_LABEL (insn))
3193               {
3194                 dest_loop = uid_loop[INSN_UID (JUMP_LABEL (insn))];
3195                 if (dest_loop)
3196                   {
3197                     for (outer_loop = dest_loop; outer_loop;
3198                          outer_loop = outer_loop->outer)
3199                       if (outer_loop == this_loop)
3200                         break;
3201                   }
3202               }
3203
3204             /* Make sure that the target of P is within the current loop.  */
3205
3206             if (JUMP_P (p) && JUMP_LABEL (p)
3207                 && uid_loop[INSN_UID (JUMP_LABEL (p))] != this_loop)
3208               outer_loop = this_loop;
3209
3210             /* If we stopped on a JUMP_INSN to the next insn after INSN,
3211                we have a block of code to try to move.
3212
3213                We look backward and then forward from the target of INSN
3214                to find a BARRIER at the same loop depth as the target.
3215                If we find such a BARRIER, we make a new label for the start
3216                of the block, invert the jump in P and point it to that label,
3217                and move the block of code to the spot we found.  */
3218
3219             if (! outer_loop
3220                 && JUMP_P (p)
3221                 && JUMP_LABEL (p) != 0
3222                 /* Just ignore jumps to labels that were never emitted.
3223                    These always indicate compilation errors.  */
3224                 && INSN_UID (JUMP_LABEL (p)) != 0
3225                 && any_condjump_p (p) && onlyjump_p (p)
3226                 && next_real_insn (JUMP_LABEL (p)) == our_next
3227                 /* If it's not safe to move the sequence, then we
3228                    mustn't try.  */
3229                 && insns_safe_to_move_p (p, NEXT_INSN (insn),
3230                                          &last_insn_to_move))
3231               {
3232                 rtx target
3233                   = JUMP_LABEL (insn) ? JUMP_LABEL (insn) : get_last_insn ();
3234                 struct loop *target_loop = uid_loop[INSN_UID (target)];
3235                 rtx loc, loc2;
3236                 rtx tmp;
3237
3238                 /* Search for possible garbage past the conditional jumps
3239                    and look for the last barrier.  */
3240                 for (tmp = last_insn_to_move;
3241                      tmp && !LABEL_P (tmp); tmp = NEXT_INSN (tmp))
3242                   if (BARRIER_P (tmp))
3243                     last_insn_to_move = tmp;
3244
3245                 for (loc = target; loc; loc = PREV_INSN (loc))
3246                   if (BARRIER_P (loc)
3247                       /* Don't move things inside a tablejump.  */
3248                       && ((loc2 = next_nonnote_insn (loc)) == 0
3249                           || !LABEL_P (loc2)
3250                           || (loc2 = next_nonnote_insn (loc2)) == 0
3251                           || !JUMP_P (loc2)
3252                           || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
3253                               && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
3254                       && uid_loop[INSN_UID (loc)] == target_loop)
3255                     break;
3256
3257                 if (loc == 0)
3258                   for (loc = target; loc; loc = NEXT_INSN (loc))
3259                     if (BARRIER_P (loc)
3260                         /* Don't move things inside a tablejump.  */
3261                         && ((loc2 = next_nonnote_insn (loc)) == 0
3262                             || !LABEL_P (loc2)
3263                             || (loc2 = next_nonnote_insn (loc2)) == 0
3264                             || !JUMP_P (loc2)
3265                             || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
3266                                 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
3267                         && uid_loop[INSN_UID (loc)] == target_loop)
3268                       break;
3269
3270                 if (loc)
3271                   {
3272                     rtx cond_label = JUMP_LABEL (p);
3273                     rtx new_label = get_label_after (p);
3274
3275                     /* Ensure our label doesn't go away.  */
3276                     LABEL_NUSES (cond_label)++;
3277
3278                     /* Verify that uid_loop is large enough and that
3279                        we can invert P.  */
3280                     if (invert_jump (p, new_label, 1))
3281                       {
3282                         rtx q, r;
3283                         bool only_notes;
3284
3285                         /* If no suitable BARRIER was found, create a suitable
3286                            one before TARGET.  Since TARGET is a fall through
3287                            path, we'll need to insert a jump around our block
3288                            and add a BARRIER before TARGET.
3289
3290                            This creates an extra unconditional jump outside
3291                            the loop.  However, the benefits of removing rarely
3292                            executed instructions from inside the loop usually
3293                            outweighs the cost of the extra unconditional jump
3294                            outside the loop.  */
3295                         if (loc == 0)
3296                           {
3297                             rtx temp;
3298
3299                             temp = gen_jump (JUMP_LABEL (insn));
3300                             temp = emit_jump_insn_before (temp, target);
3301                             JUMP_LABEL (temp) = JUMP_LABEL (insn);
3302                             LABEL_NUSES (JUMP_LABEL (insn))++;
3303                             loc = emit_barrier_before (target);
3304                           }
3305
3306                         /* Include the BARRIER after INSN and copy the
3307                            block after LOC.  */
3308                         only_notes = squeeze_notes (&new_label,
3309                                                     &last_insn_to_move);
3310                         gcc_assert (!only_notes);
3311
3312                         reorder_insns (new_label, last_insn_to_move, loc);
3313
3314                         /* All those insns are now in TARGET_LOOP.  */
3315                         for (q = new_label;
3316                              q != NEXT_INSN (last_insn_to_move);
3317                              q = NEXT_INSN (q))
3318                           uid_loop[INSN_UID (q)] = target_loop;
3319
3320                         /* The label jumped to by INSN is no longer a loop
3321                            exit.  Unless INSN does not have a label (e.g.,
3322                            it is a RETURN insn), search loop->exit_labels
3323                            to find its label_ref, and remove it.  Also turn
3324                            off LABEL_OUTSIDE_LOOP_P bit.  */
3325                         if (JUMP_LABEL (insn))
3326                           {
3327                             for (q = 0, r = this_loop->exit_labels;
3328                                  r;
3329                                  q = r, r = LABEL_NEXTREF (r))
3330                               if (XEXP (r, 0) == JUMP_LABEL (insn))
3331                                 {
3332                                   LABEL_OUTSIDE_LOOP_P (r) = 0;
3333                                   if (q)
3334                                     LABEL_NEXTREF (q) = LABEL_NEXTREF (r);
3335                                   else
3336                                     this_loop->exit_labels = LABEL_NEXTREF (r);
3337                                   break;
3338                                 }
3339
3340                             for (loop = this_loop; loop && loop != target_loop;
3341                                  loop = loop->outer)
3342                               loop->exit_count--;
3343
3344                             /* If we didn't find it, then something is
3345                                wrong.  */
3346                             gcc_assert (r);
3347                           }
3348
3349                         /* P is now a jump outside the loop, so it must be put
3350                            in loop->exit_labels, and marked as such.
3351                            The easiest way to do this is to just call
3352                            mark_loop_jump again for P.  */
3353                         mark_loop_jump (PATTERN (p), this_loop);
3354
3355                         /* If INSN now jumps to the insn after it,
3356                            delete INSN.  */
3357                         if (JUMP_LABEL (insn) != 0
3358                             && (next_real_insn (JUMP_LABEL (insn))
3359                                 == next_real_insn (insn)))
3360                           delete_related_insns (insn);
3361                       }
3362
3363                     /* Continue the loop after where the conditional
3364                        branch used to jump, since the only branch insn
3365                        in the block (if it still remains) is an inter-loop
3366                        branch and hence needs no processing.  */
3367                     insn = NEXT_INSN (cond_label);
3368
3369                     if (--LABEL_NUSES (cond_label) == 0)
3370                       delete_related_insns (cond_label);
3371
3372                     /* This loop will be continued with NEXT_INSN (insn).  */
3373                     insn = PREV_INSN (insn);
3374                   }
3375               }
3376           }
3377       }
3378 }
3379
3380 /* If any label in X jumps to a loop different from LOOP_NUM and any of the
3381    loops it is contained in, mark the target loop invalid.
3382
3383    For speed, we assume that X is part of a pattern of a JUMP_INSN.  */
3384
3385 static void
3386 mark_loop_jump (rtx x, struct loop *loop)
3387 {
3388   struct loop *dest_loop;
3389   struct loop *outer_loop;
3390   int i;
3391
3392   switch (GET_CODE (x))
3393     {
3394     case PC:
3395     case USE:
3396     case CLOBBER:
3397     case REG:
3398     case MEM:
3399     case CONST_INT:
3400     case CONST_DOUBLE:
3401     case RETURN:
3402       return;
3403
3404     case CONST:
3405       /* There could be a label reference in here.  */
3406       mark_loop_jump (XEXP (x, 0), loop);
3407       return;
3408
3409     case PLUS:
3410     case MINUS:
3411     case MULT:
3412       mark_loop_jump (XEXP (x, 0), loop);
3413       mark_loop_jump (XEXP (x, 1), loop);
3414       return;
3415
3416     case LO_SUM:
3417       /* This may refer to a LABEL_REF or SYMBOL_REF.  */
3418       mark_loop_jump (XEXP (x, 1), loop);
3419       return;
3420
3421     case SIGN_EXTEND:
3422     case ZERO_EXTEND:
3423       mark_loop_jump (XEXP (x, 0), loop);
3424       return;
3425
3426     case LABEL_REF:
3427       dest_loop = uid_loop[INSN_UID (XEXP (x, 0))];
3428
3429       /* Link together all labels that branch outside the loop.  This
3430          is used by final_[bg]iv_value and the loop unrolling code.  Also
3431          mark this LABEL_REF so we know that this branch should predict
3432          false.  */
3433
3434       /* A check to make sure the label is not in an inner nested loop,
3435          since this does not count as a loop exit.  */
3436       if (dest_loop)
3437         {
3438           for (outer_loop = dest_loop; outer_loop;
3439                outer_loop = outer_loop->outer)
3440             if (outer_loop == loop)
3441               break;
3442         }
3443       else
3444         outer_loop = NULL;
3445
3446       if (loop && ! outer_loop)
3447         {
3448           LABEL_OUTSIDE_LOOP_P (x) = 1;
3449           LABEL_NEXTREF (x) = loop->exit_labels;
3450           loop->exit_labels = x;
3451
3452           for (outer_loop = loop;
3453                outer_loop && outer_loop != dest_loop;
3454                outer_loop = outer_loop->outer)
3455             outer_loop->exit_count++;
3456         }
3457
3458       /* If this is inside a loop, but not in the current loop or one enclosed
3459          by it, it invalidates at least one loop.  */
3460
3461       if (! dest_loop)
3462         return;
3463
3464       /* We must invalidate every nested loop containing the target of this
3465          label, except those that also contain the jump insn.  */
3466
3467       for (; dest_loop; dest_loop = dest_loop->outer)
3468         {
3469           /* Stop when we reach a loop that also contains the jump insn.  */
3470           for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3471             if (dest_loop == outer_loop)
3472               return;
3473
3474           /* If we get here, we know we need to invalidate a loop.  */
3475           if (loop_dump_stream && ! dest_loop->invalid)
3476             fprintf (loop_dump_stream,
3477                      "\nLoop at %d ignored due to multiple entry points.\n",
3478                      INSN_UID (dest_loop->start));
3479
3480           dest_loop->invalid = 1;
3481         }
3482       return;
3483
3484     case SET:
3485       /* If this is not setting pc, ignore.  */
3486       if (SET_DEST (x) == pc_rtx)
3487         mark_loop_jump (SET_SRC (x), loop);
3488       return;
3489
3490     case IF_THEN_ELSE:
3491       mark_loop_jump (XEXP (x, 1), loop);
3492       mark_loop_jump (XEXP (x, 2), loop);
3493       return;
3494
3495     case PARALLEL:
3496     case ADDR_VEC:
3497       for (i = 0; i < XVECLEN (x, 0); i++)
3498         mark_loop_jump (XVECEXP (x, 0, i), loop);
3499       return;
3500
3501     case ADDR_DIFF_VEC:
3502       for (i = 0; i < XVECLEN (x, 1); i++)
3503         mark_loop_jump (XVECEXP (x, 1, i), loop);
3504       return;
3505
3506     default:
3507       /* Strictly speaking this is not a jump into the loop, only a possible
3508          jump out of the loop.  However, we have no way to link the destination
3509          of this jump onto the list of exit labels.  To be safe we mark this
3510          loop and any containing loops as invalid.  */
3511       if (loop)
3512         {
3513           for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3514             {
3515               if (loop_dump_stream && ! outer_loop->invalid)
3516                 fprintf (loop_dump_stream,
3517                          "\nLoop at %d ignored due to unknown exit jump.\n",
3518                          INSN_UID (outer_loop->start));
3519               outer_loop->invalid = 1;
3520             }
3521         }
3522       return;
3523     }
3524 }
3525 \f
3526 /* Return nonzero if there is a label in the range from
3527    insn INSN to and including the insn whose luid is END
3528    INSN must have an assigned luid (i.e., it must not have
3529    been previously created by loop.c).  */
3530
3531 static int
3532 labels_in_range_p (rtx insn, int end)
3533 {
3534   while (insn && INSN_LUID (insn) <= end)
3535     {
3536       if (LABEL_P (insn))
3537         return 1;
3538       insn = NEXT_INSN (insn);
3539     }
3540
3541   return 0;
3542 }
3543
3544 /* Record that a memory reference X is being set.  */
3545
3546 static void
3547 note_addr_stored (rtx x, rtx y ATTRIBUTE_UNUSED,
3548                   void *data ATTRIBUTE_UNUSED)
3549 {
3550   struct loop_info *loop_info = data;
3551
3552   if (x == 0 || !MEM_P (x))
3553     return;
3554
3555   /* Count number of memory writes.
3556      This affects heuristics in strength_reduce.  */
3557   loop_info->num_mem_sets++;
3558
3559   /* BLKmode MEM means all memory is clobbered.  */
3560   if (GET_MODE (x) == BLKmode)
3561     {
3562       if (MEM_READONLY_P (x))
3563         loop_info->unknown_constant_address_altered = 1;
3564       else
3565         loop_info->unknown_address_altered = 1;
3566
3567       return;
3568     }
3569
3570   loop_info->store_mems = gen_rtx_EXPR_LIST (VOIDmode, x,
3571                                              loop_info->store_mems);
3572 }
3573
3574 /* X is a value modified by an INSN that references a biv inside a loop
3575    exit test (i.e., X is somehow related to the value of the biv).  If X
3576    is a pseudo that is used more than once, then the biv is (effectively)
3577    used more than once.  DATA is a pointer to a loop_regs structure.  */
3578
3579 static void
3580 note_set_pseudo_multiple_uses (rtx x, rtx y ATTRIBUTE_UNUSED, void *data)
3581 {
3582   struct loop_regs *regs = (struct loop_regs *) data;
3583
3584   if (x == 0)
3585     return;
3586
3587   while (GET_CODE (x) == STRICT_LOW_PART
3588          || GET_CODE (x) == SIGN_EXTRACT
3589          || GET_CODE (x) == ZERO_EXTRACT
3590          || GET_CODE (x) == SUBREG)
3591     x = XEXP (x, 0);
3592
3593   if (!REG_P (x) || REGNO (x) < FIRST_PSEUDO_REGISTER)
3594     return;
3595
3596   /* If we do not have usage information, or if we know the register
3597      is used more than once, note that fact for check_dbra_loop.  */
3598   if (REGNO (x) >= max_reg_before_loop
3599       || ! regs->array[REGNO (x)].single_usage
3600       || regs->array[REGNO (x)].single_usage == const0_rtx)
3601     regs->multiple_uses = 1;
3602 }
3603 \f
3604 /* Return nonzero if the rtx X is invariant over the current loop.
3605
3606    The value is 2 if we refer to something only conditionally invariant.
3607
3608    A memory ref is invariant if it is not volatile and does not conflict
3609    with anything stored in `loop_info->store_mems'.  */
3610
3611 static int
3612 loop_invariant_p (const struct loop *loop, rtx x)
3613 {
3614   struct loop_info *loop_info = LOOP_INFO (loop);
3615   struct loop_regs *regs = LOOP_REGS (loop);
3616   int i;
3617   enum rtx_code code;
3618   const char *fmt;
3619   int conditional = 0;
3620   rtx mem_list_entry;
3621
3622   if (x == 0)
3623     return 1;
3624   code = GET_CODE (x);
3625   switch (code)
3626     {
3627     case CONST_INT:
3628     case CONST_DOUBLE:
3629     case SYMBOL_REF:
3630     case CONST:
3631       return 1;
3632
3633     case LABEL_REF:
3634       return 1;
3635
3636     case PC:
3637     case CC0:
3638     case UNSPEC_VOLATILE:
3639       return 0;
3640
3641     case REG:
3642       if ((x == frame_pointer_rtx || x == hard_frame_pointer_rtx
3643            || x == arg_pointer_rtx || x == pic_offset_table_rtx)
3644           && ! current_function_has_nonlocal_goto)
3645         return 1;
3646
3647       if (LOOP_INFO (loop)->has_call
3648           && REGNO (x) < FIRST_PSEUDO_REGISTER
3649           && TEST_HARD_REG_BIT (regs_invalidated_by_call, REGNO (x)))
3650         return 0;
3651
3652       /* Out-of-range regs can occur when we are called from unrolling.
3653          These registers created by the unroller are set in the loop,
3654          hence are never invariant.
3655          Other out-of-range regs can be generated by load_mems; those that
3656          are written to in the loop are not invariant, while those that are
3657          not written to are invariant.  It would be easy for load_mems
3658          to set n_times_set correctly for these registers, however, there
3659          is no easy way to distinguish them from registers created by the
3660          unroller.  */
3661
3662       if (REGNO (x) >= (unsigned) regs->num)
3663         return 0;
3664
3665       if (regs->array[REGNO (x)].set_in_loop < 0)
3666         return 2;
3667
3668       return regs->array[REGNO (x)].set_in_loop == 0;
3669
3670     case MEM:
3671       /* Volatile memory references must be rejected.  Do this before
3672          checking for read-only items, so that volatile read-only items
3673          will be rejected also.  */
3674       if (MEM_VOLATILE_P (x))
3675         return 0;
3676
3677       /* See if there is any dependence between a store and this load.  */
3678       mem_list_entry = loop_info->store_mems;
3679       while (mem_list_entry)
3680         {
3681           if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
3682                                x, rtx_varies_p))
3683             return 0;
3684
3685           mem_list_entry = XEXP (mem_list_entry, 1);
3686         }
3687
3688       /* It's not invalidated by a store in memory
3689          but we must still verify the address is invariant.  */
3690       break;
3691
3692     case ASM_OPERANDS:
3693       /* Don't mess with insns declared volatile.  */
3694       if (MEM_VOLATILE_P (x))
3695         return 0;
3696       break;
3697
3698     default:
3699       break;
3700     }
3701
3702   fmt = GET_RTX_FORMAT (code);
3703   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3704     {
3705       if (fmt[i] == 'e')
3706         {
3707           int tem = loop_invariant_p (loop, XEXP (x, i));
3708           if (tem == 0)
3709             return 0;
3710           if (tem == 2)
3711             conditional = 1;
3712         }
3713       else if (fmt[i] == 'E')
3714         {
3715           int j;
3716           for (j = 0; j < XVECLEN (x, i); j++)
3717             {
3718               int tem = loop_invariant_p (loop, XVECEXP (x, i, j));
3719               if (tem == 0)
3720                 return 0;
3721               if (tem == 2)
3722                 conditional = 1;
3723             }
3724
3725         }
3726     }
3727
3728   return 1 + conditional;
3729 }
3730 \f
3731 /* Return nonzero if all the insns in the loop that set REG
3732    are INSN and the immediately following insns,
3733    and if each of those insns sets REG in an invariant way
3734    (not counting uses of REG in them).
3735
3736    The value is 2 if some of these insns are only conditionally invariant.
3737
3738    We assume that INSN itself is the first set of REG
3739    and that its source is invariant.  */
3740
3741 static int
3742 consec_sets_invariant_p (const struct loop *loop, rtx reg, int n_sets,
3743                          rtx insn)
3744 {
3745   struct loop_regs *regs = LOOP_REGS (loop);
3746   rtx p = insn;
3747   unsigned int regno = REGNO (reg);
3748   rtx temp;
3749   /* Number of sets we have to insist on finding after INSN.  */
3750   int count = n_sets - 1;
3751   int old = regs->array[regno].set_in_loop;
3752   int value = 0;
3753   int this;
3754
3755   /* If N_SETS hit the limit, we can't rely on its value.  */
3756   if (n_sets == 127)
3757     return 0;
3758
3759   regs->array[regno].set_in_loop = 0;
3760
3761   while (count > 0)
3762     {
3763       enum rtx_code code;
3764       rtx set;
3765
3766       p = NEXT_INSN (p);
3767       code = GET_CODE (p);
3768
3769       /* If library call, skip to end of it.  */
3770       if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
3771         p = XEXP (temp, 0);
3772
3773       this = 0;
3774       if (code == INSN
3775           && (set = single_set (p))
3776           && REG_P (SET_DEST (set))
3777           && REGNO (SET_DEST (set)) == regno)
3778         {
3779           this = loop_invariant_p (loop, SET_SRC (set));
3780           if (this != 0)
3781             value |= this;
3782           else if ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX)))
3783             {
3784               /* If this is a libcall, then any invariant REG_EQUAL note is OK.
3785                  If this is an ordinary insn, then only CONSTANT_P REG_EQUAL
3786                  notes are OK.  */
3787               this = (CONSTANT_P (XEXP (temp, 0))
3788                       || (find_reg_note (p, REG_RETVAL, NULL_RTX)
3789                           && loop_invariant_p (loop, XEXP (temp, 0))));
3790               if (this != 0)
3791                 value |= this;
3792             }
3793         }
3794       if (this != 0)
3795         count--;
3796       else if (code != NOTE)
3797         {
3798           regs->array[regno].set_in_loop = old;
3799           return 0;
3800         }
3801     }
3802
3803   regs->array[regno].set_in_loop = old;
3804   /* If loop_invariant_p ever returned 2, we return 2.  */
3805   return 1 + (value & 2);
3806 }
3807 \f
3808 /* Look at all uses (not sets) of registers in X.  For each, if it is
3809    the single use, set USAGE[REGNO] to INSN; if there was a previous use in
3810    a different insn, set USAGE[REGNO] to const0_rtx.  */
3811
3812 static void
3813 find_single_use_in_loop (struct loop_regs *regs, rtx insn, rtx x)
3814 {
3815   enum rtx_code code = GET_CODE (x);
3816   const char *fmt = GET_RTX_FORMAT (code);
3817   int i, j;
3818
3819   if (code == REG)
3820     regs->array[REGNO (x)].single_usage
3821       = (regs->array[REGNO (x)].single_usage != 0
3822          && regs->array[REGNO (x)].single_usage != insn)
3823         ? const0_rtx : insn;
3824
3825   else if (code == SET)
3826     {
3827       /* Don't count SET_DEST if it is a REG; otherwise count things
3828          in SET_DEST because if a register is partially modified, it won't
3829          show up as a potential movable so we don't care how USAGE is set
3830          for it.  */
3831       if (!REG_P (SET_DEST (x)))
3832         find_single_use_in_loop (regs, insn, SET_DEST (x));
3833       find_single_use_in_loop (regs, insn, SET_SRC (x));
3834     }
3835   else
3836     for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3837       {
3838         if (fmt[i] == 'e' && XEXP (x, i) != 0)
3839           find_single_use_in_loop (regs, insn, XEXP (x, i));
3840         else if (fmt[i] == 'E')
3841           for (j = XVECLEN (x, i) - 1; j >= 0; j--)
3842             find_single_use_in_loop (regs, insn, XVECEXP (x, i, j));
3843       }
3844 }
3845 \f
3846 /* Count and record any set in X which is contained in INSN.  Update
3847    REGS->array[I].MAY_NOT_OPTIMIZE and LAST_SET for any register I set
3848    in X.  */
3849
3850 static void
3851 count_one_set (struct loop_regs *regs, rtx insn, rtx x, rtx *last_set)
3852 {
3853   if (GET_CODE (x) == CLOBBER && REG_P (XEXP (x, 0)))
3854     /* Don't move a reg that has an explicit clobber.
3855        It's not worth the pain to try to do it correctly.  */
3856     regs->array[REGNO (XEXP (x, 0))].may_not_optimize = 1;
3857
3858   if (GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
3859     {
3860       rtx dest = SET_DEST (x);
3861       while (GET_CODE (dest) == SUBREG
3862              || GET_CODE (dest) == ZERO_EXTRACT
3863              || GET_CODE (dest) == STRICT_LOW_PART)
3864         dest = XEXP (dest, 0);
3865       if (REG_P (dest))
3866         {
3867           int i;
3868           int regno = REGNO (dest);
3869           for (i = 0; i < LOOP_REGNO_NREGS (regno, dest); i++)
3870             {
3871               /* If this is the first setting of this reg
3872                  in current basic block, and it was set before,
3873                  it must be set in two basic blocks, so it cannot
3874                  be moved out of the loop.  */
3875               if (regs->array[regno].set_in_loop > 0
3876                   && last_set[regno] == 0)
3877                 regs->array[regno+i].may_not_optimize = 1;
3878               /* If this is not first setting in current basic block,
3879                  see if reg was used in between previous one and this.
3880                  If so, neither one can be moved.  */
3881               if (last_set[regno] != 0
3882                   && reg_used_between_p (dest, last_set[regno], insn))
3883                 regs->array[regno+i].may_not_optimize = 1;
3884               if (regs->array[regno+i].set_in_loop < 127)
3885                 ++regs->array[regno+i].set_in_loop;
3886               last_set[regno+i] = insn;
3887             }
3888         }
3889     }
3890 }
3891 \f
3892 /* Given a loop that is bounded by LOOP->START and LOOP->END and that
3893    is entered at LOOP->SCAN_START, return 1 if the register set in SET
3894    contained in insn INSN is used by any insn that precedes INSN in
3895    cyclic order starting from the loop entry point.
3896
3897    We don't want to use INSN_LUID here because if we restrict INSN to those
3898    that have a valid INSN_LUID, it means we cannot move an invariant out
3899    from an inner loop past two loops.  */
3900
3901 static int
3902 loop_reg_used_before_p (const struct loop *loop, rtx set, rtx insn)
3903 {
3904   rtx reg = SET_DEST (set);
3905   rtx p;
3906
3907   /* Scan forward checking for register usage.  If we hit INSN, we
3908      are done.  Otherwise, if we hit LOOP->END, wrap around to LOOP->START.  */
3909   for (p = loop->scan_start; p != insn; p = NEXT_INSN (p))
3910     {
3911       if (INSN_P (p) && reg_overlap_mentioned_p (reg, PATTERN (p)))
3912         return 1;
3913
3914       if (p == loop->end)
3915         p = loop->start;
3916     }
3917
3918   return 0;
3919 }
3920 \f
3921
3922 /* Information we collect about arrays that we might want to prefetch.  */
3923 struct prefetch_info
3924 {
3925   struct iv_class *class;       /* Class this prefetch is based on.  */
3926   struct induction *giv;        /* GIV this prefetch is based on.  */
3927   rtx base_address;             /* Start prefetching from this address plus
3928                                    index.  */
3929   HOST_WIDE_INT index;
3930   HOST_WIDE_INT stride;         /* Prefetch stride in bytes in each
3931                                    iteration.  */
3932   unsigned int bytes_accessed;  /* Sum of sizes of all accesses to this
3933                                    prefetch area in one iteration.  */
3934   unsigned int total_bytes;     /* Total bytes loop will access in this block.
3935                                    This is set only for loops with known
3936                                    iteration counts and is 0xffffffff
3937                                    otherwise.  */
3938   int prefetch_in_loop;         /* Number of prefetch insns in loop.  */
3939   int prefetch_before_loop;     /* Number of prefetch insns before loop.  */
3940   unsigned int write : 1;       /* 1 for read/write prefetches.  */
3941 };
3942
3943 /* Data used by check_store function.  */
3944 struct check_store_data
3945 {
3946   rtx mem_address;
3947   int mem_write;
3948 };
3949
3950 static void check_store (rtx, rtx, void *);
3951 static void emit_prefetch_instructions (struct loop *);
3952 static int rtx_equal_for_prefetch_p (rtx, rtx);
3953
3954 /* Set mem_write when mem_address is found.  Used as callback to
3955    note_stores.  */
3956 static void
3957 check_store (rtx x, rtx pat ATTRIBUTE_UNUSED, void *data)
3958 {
3959   struct check_store_data *d = (struct check_store_data *) data;
3960
3961   if ((MEM_P (x)) && rtx_equal_p (d->mem_address, XEXP (x, 0)))
3962     d->mem_write = 1;
3963 }
3964 \f
3965 /* Like rtx_equal_p, but attempts to swap commutative operands.  This is
3966    important to get some addresses combined.  Later more sophisticated
3967    transformations can be added when necessary.
3968
3969    ??? Same trick with swapping operand is done at several other places.
3970    It can be nice to develop some common way to handle this.  */
3971
3972 static int
3973 rtx_equal_for_prefetch_p (rtx x, rtx y)
3974 {
3975   int i;
3976   int j;
3977   enum rtx_code code = GET_CODE (x);
3978   const char *fmt;
3979
3980   if (x == y)
3981     return 1;
3982   if (code != GET_CODE (y))
3983     return 0;
3984
3985   if (COMMUTATIVE_ARITH_P (x))
3986     {
3987       return ((rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 0))
3988                && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 1)))
3989               || (rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 1))
3990                   && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 0))));
3991     }
3992
3993   /* Compare the elements.  If any pair of corresponding elements fails to
3994      match, return 0 for the whole thing.  */
3995
3996   fmt = GET_RTX_FORMAT (code);
3997   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3998     {
3999       switch (fmt[i])
4000         {
4001         case 'w':
4002           if (XWINT (x, i) != XWINT (y, i))
4003             return 0;
4004           break;
4005
4006         case 'i':
4007           if (XINT (x, i) != XINT (y, i))
4008             return 0;
4009           break;
4010
4011         case 'E':
4012           /* Two vectors must have the same length.  */
4013           if (XVECLEN (x, i) != XVECLEN (y, i))
4014             return 0;
4015
4016           /* And the corresponding elements must match.  */
4017           for (j = 0; j < XVECLEN (x, i); j++)
4018             if (rtx_equal_for_prefetch_p (XVECEXP (x, i, j),
4019                                           XVECEXP (y, i, j)) == 0)
4020               return 0;
4021           break;
4022
4023         case 'e':
4024           if (rtx_equal_for_prefetch_p (XEXP (x, i), XEXP (y, i)) == 0)
4025             return 0;
4026           break;
4027
4028         case 's':
4029           if (strcmp (XSTR (x, i), XSTR (y, i)))
4030             return 0;
4031           break;
4032
4033         case 'u':
4034           /* These are just backpointers, so they don't matter.  */
4035           break;
4036
4037         case '0':
4038           break;
4039
4040           /* It is believed that rtx's at this level will never
4041              contain anything but integers and other rtx's,
4042              except for within LABEL_REFs and SYMBOL_REFs.  */
4043         default:
4044           gcc_unreachable ();
4045         }
4046     }
4047   return 1;
4048 }
4049 \f
4050 /* Remove constant addition value from the expression X (when present)
4051    and return it.  */
4052
4053 static HOST_WIDE_INT
4054 remove_constant_addition (rtx *x)
4055 {
4056   HOST_WIDE_INT addval = 0;
4057   rtx exp = *x;
4058
4059   /* Avoid clobbering a shared CONST expression.  */
4060   if (GET_CODE (exp) == CONST)
4061     {
4062       if (GET_CODE (XEXP (exp, 0)) == PLUS
4063           && GET_CODE (XEXP (XEXP (exp, 0), 0)) == SYMBOL_REF
4064           && GET_CODE (XEXP (XEXP (exp, 0), 1)) == CONST_INT)
4065         {
4066           *x = XEXP (XEXP (exp, 0), 0);
4067           return INTVAL (XEXP (XEXP (exp, 0), 1));
4068         }
4069       return 0;
4070     }
4071
4072   if (GET_CODE (exp) == CONST_INT)
4073     {
4074       addval = INTVAL (exp);
4075       *x = const0_rtx;
4076     }
4077
4078   /* For plus expression recurse on ourself.  */
4079   else if (GET_CODE (exp) == PLUS)
4080     {
4081       addval += remove_constant_addition (&XEXP (exp, 0));
4082       addval += remove_constant_addition (&XEXP (exp, 1));
4083
4084       /* In case our parameter was constant, remove extra zero from the
4085          expression.  */
4086       if (XEXP (exp, 0) == const0_rtx)
4087         *x = XEXP (exp, 1);
4088       else if (XEXP (exp, 1) == const0_rtx)
4089         *x = XEXP (exp, 0);
4090     }
4091
4092   return addval;
4093 }
4094
4095 /* Attempt to identify accesses to arrays that are most likely to cause cache
4096    misses, and emit prefetch instructions a few prefetch blocks forward.
4097
4098    To detect the arrays we use the GIV information that was collected by the
4099    strength reduction pass.
4100
4101    The prefetch instructions are generated after the GIV information is done
4102    and before the strength reduction process. The new GIVs are injected into
4103    the strength reduction tables, so the prefetch addresses are optimized as
4104    well.
4105
4106    GIVs are split into base address, stride, and constant addition values.
4107    GIVs with the same address, stride and close addition values are combined
4108    into a single prefetch.  Also writes to GIVs are detected, so that prefetch
4109    for write instructions can be used for the block we write to, on machines
4110    that support write prefetches.
4111
4112    Several heuristics are used to determine when to prefetch.  They are
4113    controlled by defined symbols that can be overridden for each target.  */
4114
4115 static void
4116 emit_prefetch_instructions (struct loop *loop)
4117 {
4118   int num_prefetches = 0;
4119   int num_real_prefetches = 0;
4120   int num_real_write_prefetches = 0;
4121   int num_prefetches_before = 0;
4122   int num_write_prefetches_before = 0;
4123   int ahead = 0;
4124   int i;
4125   struct iv_class *bl;
4126   struct induction *iv;
4127   struct prefetch_info info[MAX_PREFETCHES];
4128   struct loop_ivs *ivs = LOOP_IVS (loop);
4129
4130   if (!HAVE_prefetch || PREFETCH_BLOCK == 0)
4131     return;
4132
4133   /* Consider only loops w/o calls.  When a call is done, the loop is probably
4134      slow enough to read the memory.  */
4135   if (PREFETCH_NO_CALL && LOOP_INFO (loop)->has_call)
4136     {
4137       if (loop_dump_stream)
4138         fprintf (loop_dump_stream, "Prefetch: ignoring loop: has call.\n");
4139
4140       return;
4141     }
4142
4143   /* Don't prefetch in loops known to have few iterations.  */
4144   if (PREFETCH_NO_LOW_LOOPCNT
4145       && LOOP_INFO (loop)->n_iterations
4146       && LOOP_INFO (loop)->n_iterations <= PREFETCH_LOW_LOOPCNT)
4147     {
4148       if (loop_dump_stream)
4149         fprintf (loop_dump_stream,
4150                  "Prefetch: ignoring loop: not enough iterations.\n");
4151       return;
4152     }
4153
4154   /* Search all induction variables and pick those interesting for the prefetch
4155      machinery.  */
4156   for (bl = ivs->list; bl; bl = bl->next)
4157     {
4158       struct induction *biv = bl->biv, *biv1;
4159       int basestride = 0;
4160
4161       biv1 = biv;
4162
4163       /* Expect all BIVs to be executed in each iteration.  This makes our
4164          analysis more conservative.  */
4165       while (biv1)
4166         {
4167           /* Discard non-constant additions that we can't handle well yet, and
4168              BIVs that are executed multiple times; such BIVs ought to be
4169              handled in the nested loop.  We accept not_every_iteration BIVs,
4170              since these only result in larger strides and make our
4171              heuristics more conservative.  */
4172           if (GET_CODE (biv->add_val) != CONST_INT)
4173             {
4174               if (loop_dump_stream)
4175                 {
4176                   fprintf (loop_dump_stream,
4177                     "Prefetch: ignoring biv %d: non-constant addition at insn %d:",
4178                            REGNO (biv->src_reg), INSN_UID (biv->insn));
4179                   print_rtl (loop_dump_stream, biv->add_val);
4180                   fprintf (loop_dump_stream, "\n");
4181                 }
4182               break;
4183             }
4184
4185           if (biv->maybe_multiple)
4186             {
4187               if (loop_dump_stream)
4188                 {
4189                   fprintf (loop_dump_stream,
4190                            "Prefetch: ignoring biv %d: maybe_multiple at insn %i:",
4191                            REGNO (biv->src_reg), INSN_UID (biv->insn));
4192                   print_rtl (loop_dump_stream, biv->add_val);
4193                   fprintf (loop_dump_stream, "\n");
4194                 }
4195               break;
4196             }
4197
4198           basestride += INTVAL (biv1->add_val);
4199           biv1 = biv1->next_iv;
4200         }
4201
4202       if (biv1 || !basestride)
4203         continue;
4204
4205       for (iv = bl->giv; iv; iv = iv->next_iv)
4206         {
4207           rtx address;
4208           rtx temp;
4209           HOST_WIDE_INT index = 0;
4210           int add = 1;
4211           HOST_WIDE_INT stride = 0;
4212           int stride_sign = 1;
4213           struct check_store_data d;
4214           const char *ignore_reason = NULL;
4215           int size = GET_MODE_SIZE (GET_MODE (iv));
4216
4217           /* See whether an induction variable is interesting to us and if
4218              not, report the reason.  */
4219           if (iv->giv_type != DEST_ADDR)
4220             ignore_reason = "giv is not a destination address";
4221
4222           /* We are interested only in constant stride memory references
4223              in order to be able to compute density easily.  */
4224           else if (GET_CODE (iv->mult_val) != CONST_INT)
4225             ignore_reason = "stride is not constant";
4226
4227           else
4228             {
4229               stride = INTVAL (iv->mult_val) * basestride;
4230               if (stride < 0)
4231                 {
4232                   stride = -stride;
4233                   stride_sign = -1;
4234                 }
4235
4236               /* On some targets, reversed order prefetches are not
4237                  worthwhile.  */
4238               if (PREFETCH_NO_REVERSE_ORDER && stride_sign < 0)
4239                 ignore_reason = "reversed order stride";
4240
4241               /* Prefetch of accesses with an extreme stride might not be
4242                  worthwhile, either.  */
4243               else if (PREFETCH_NO_EXTREME_STRIDE
4244                        && stride > PREFETCH_EXTREME_STRIDE)
4245                 ignore_reason = "extreme stride";
4246
4247               /* Ignore GIVs with varying add values; we can't predict the
4248                  value for the next iteration.  */
4249               else if (!loop_invariant_p (loop, iv->add_val))
4250                 ignore_reason = "giv has varying add value";
4251
4252               /* Ignore GIVs in the nested loops; they ought to have been
4253                  handled already.  */
4254               else if (iv->maybe_multiple)
4255                 ignore_reason = "giv is in nested loop";
4256             }
4257
4258           if (ignore_reason != NULL)
4259             {
4260               if (loop_dump_stream)
4261                 fprintf (loop_dump_stream,
4262                          "Prefetch: ignoring giv at %d: %s.\n",
4263                          INSN_UID (iv->insn), ignore_reason);
4264               continue;
4265             }
4266
4267           /* Determine the pointer to the basic array we are examining.  It is
4268              the sum of the BIV's initial value and the GIV's add_val.  */
4269           address = copy_rtx (iv->add_val);
4270           temp = copy_rtx (bl->initial_value);
4271
4272           address = simplify_gen_binary (PLUS, Pmode, temp, address);
4273           index = remove_constant_addition (&address);
4274
4275           d.mem_write = 0;
4276           d.mem_address = *iv->location;
4277
4278           /* When the GIV is not always executed, we might be better off by
4279              not dirtying the cache pages.  */
4280           if (PREFETCH_CONDITIONAL || iv->always_executed)
4281             note_stores (PATTERN (iv->insn), check_store, &d);
4282           else
4283             {
4284               if (loop_dump_stream)
4285                 fprintf (loop_dump_stream, "Prefetch: Ignoring giv at %d: %s\n",
4286                          INSN_UID (iv->insn), "in conditional code.");
4287               continue;
4288             }
4289
4290           /* Attempt to find another prefetch to the same array and see if we
4291              can merge this one.  */
4292           for (i = 0; i < num_prefetches; i++)
4293             if (rtx_equal_for_prefetch_p (address, info[i].base_address)
4294                 && stride == info[i].stride)
4295               {
4296                 /* In case both access same array (same location
4297                    just with small difference in constant indexes), merge
4298                    the prefetches.  Just do the later and the earlier will
4299                    get prefetched from previous iteration.
4300                    The artificial threshold should not be too small,
4301                    but also not bigger than small portion of memory usually
4302                    traversed by single loop.  */
4303                 if (index >= info[i].index
4304                     && index - info[i].index < PREFETCH_EXTREME_DIFFERENCE)
4305                   {
4306                     info[i].write |= d.mem_write;
4307                     info[i].bytes_accessed += size;
4308                     info[i].index = index;
4309                     info[i].giv = iv;
4310                     info[i].class = bl;
4311                     info[num_prefetches].base_address = address;
4312                     add = 0;
4313                     break;
4314                   }
4315
4316                 if (index < info[i].index
4317                     && info[i].index - index < PREFETCH_EXTREME_DIFFERENCE)
4318                   {
4319                     info[i].write |= d.mem_write;
4320                     info[i].bytes_accessed += size;
4321                     add = 0;
4322                     break;
4323                   }
4324               }
4325
4326           /* Merging failed.  */
4327           if (add)
4328             {
4329               info[num_prefetches].giv = iv;
4330               info[num_prefetches].class = bl;
4331               info[num_prefetches].index = index;
4332               info[num_prefetches].stride = stride;
4333               info[num_prefetches].base_address = address;
4334               info[num_prefetches].write = d.mem_write;
4335               info[num_prefetches].bytes_accessed = size;
4336               num_prefetches++;
4337               if (num_prefetches >= MAX_PREFETCHES)
4338                 {
4339                   if (loop_dump_stream)
4340                     fprintf (loop_dump_stream,
4341                              "Maximal number of prefetches exceeded.\n");
4342                   return;
4343                 }
4344             }
4345         }
4346     }
4347
4348   for (i = 0; i < num_prefetches; i++)
4349     {
4350       int density;
4351
4352       /* Attempt to calculate the total number of bytes fetched by all
4353          iterations of the loop.  Avoid overflow.  */
4354       if (LOOP_INFO (loop)->n_iterations
4355           && ((unsigned HOST_WIDE_INT) (0xffffffff / info[i].stride)
4356               >= LOOP_INFO (loop)->n_iterations))
4357         info[i].total_bytes = info[i].stride * LOOP_INFO (loop)->n_iterations;
4358       else
4359         info[i].total_bytes = 0xffffffff;
4360
4361       density = info[i].bytes_accessed * 100 / info[i].stride;
4362
4363       /* Prefetch might be worthwhile only when the loads/stores are dense.  */
4364       if (PREFETCH_ONLY_DENSE_MEM)
4365         if (density * 256 > PREFETCH_DENSE_MEM * 100
4366             && (info[i].total_bytes / PREFETCH_BLOCK
4367                 >= PREFETCH_BLOCKS_BEFORE_LOOP_MIN))
4368           {
4369             info[i].prefetch_before_loop = 1;
4370             info[i].prefetch_in_loop
4371               = (info[i].total_bytes / PREFETCH_BLOCK
4372                  > PREFETCH_BLOCKS_BEFORE_LOOP_MAX);
4373           }
4374         else
4375           {
4376             info[i].prefetch_in_loop = 0, info[i].prefetch_before_loop = 0;
4377             if (loop_dump_stream)
4378               fprintf (loop_dump_stream,
4379                   "Prefetch: ignoring giv at %d: %d%% density is too low.\n",
4380                        INSN_UID (info[i].giv->insn), density);
4381           }
4382       else
4383         info[i].prefetch_in_loop = 1, info[i].prefetch_before_loop = 1;
4384
4385       /* Find how many prefetch instructions we'll use within the loop.  */
4386       if (info[i].prefetch_in_loop != 0)
4387         {
4388           info[i].prefetch_in_loop = ((info[i].stride + PREFETCH_BLOCK - 1)
4389                                   / PREFETCH_BLOCK);
4390           num_real_prefetches += info[i].prefetch_in_loop;
4391           if (info[i].write)
4392             num_real_write_prefetches += info[i].prefetch_in_loop;
4393         }
4394     }
4395
4396   /* Determine how many iterations ahead to prefetch within the loop, based
4397      on how many prefetches we currently expect to do within the loop.  */
4398   if (num_real_prefetches != 0)
4399     {
4400       if ((ahead = SIMULTANEOUS_PREFETCHES / num_real_prefetches) == 0)
4401         {
4402           if (loop_dump_stream)
4403             fprintf (loop_dump_stream,
4404                      "Prefetch: ignoring prefetches within loop: ahead is zero; %d < %d\n",
4405                      SIMULTANEOUS_PREFETCHES, num_real_prefetches);
4406           num_real_prefetches = 0, num_real_write_prefetches = 0;
4407         }
4408     }
4409   /* We'll also use AHEAD to determine how many prefetch instructions to
4410      emit before a loop, so don't leave it zero.  */
4411   if (ahead == 0)
4412     ahead = PREFETCH_BLOCKS_BEFORE_LOOP_MAX;
4413
4414   for (i = 0; i < num_prefetches; i++)
4415     {
4416       /* Update if we've decided not to prefetch anything within the loop.  */
4417       if (num_real_prefetches == 0)
4418         info[i].prefetch_in_loop = 0;
4419
4420       /* Find how many prefetch instructions we'll use before the loop.  */
4421       if (info[i].prefetch_before_loop != 0)
4422         {
4423           int n = info[i].total_bytes / PREFETCH_BLOCK;
4424           if (n > ahead)
4425             n = ahead;
4426           info[i].prefetch_before_loop = n;
4427           num_prefetches_before += n;
4428           if (info[i].write)
4429             num_write_prefetches_before += n;
4430         }
4431
4432       if (loop_dump_stream)
4433         {
4434           if (info[i].prefetch_in_loop == 0
4435               && info[i].prefetch_before_loop == 0)
4436             continue;
4437           fprintf (loop_dump_stream, "Prefetch insn: %d",
4438                    INSN_UID (info[i].giv->insn));
4439           fprintf (loop_dump_stream,
4440                    "; in loop: %d; before: %d; %s\n",
4441                    info[i].prefetch_in_loop,
4442                    info[i].prefetch_before_loop,
4443                    info[i].write ? "read/write" : "read only");
4444           fprintf (loop_dump_stream,
4445                    " density: %d%%; bytes_accessed: %u; total_bytes: %u\n",
4446                    (int) (info[i].bytes_accessed * 100 / info[i].stride),
4447                    info[i].bytes_accessed, info[i].total_bytes);
4448           fprintf (loop_dump_stream, " index: " HOST_WIDE_INT_PRINT_DEC
4449                    "; stride: " HOST_WIDE_INT_PRINT_DEC "; address: ",
4450                    info[i].index, info[i].stride);
4451           print_rtl (loop_dump_stream, info[i].base_address);
4452           fprintf (loop_dump_stream, "\n");
4453         }
4454     }
4455
4456   if (num_real_prefetches + num_prefetches_before > 0)
4457     {
4458       /* Record that this loop uses prefetch instructions.  */
4459       LOOP_INFO (loop)->has_prefetch = 1;
4460
4461       if (loop_dump_stream)
4462         {
4463           fprintf (loop_dump_stream, "Real prefetches needed within loop: %d (write: %d)\n",
4464                    num_real_prefetches, num_real_write_prefetches);
4465           fprintf (loop_dump_stream, "Real prefetches needed before loop: %d (write: %d)\n",
4466                    num_prefetches_before, num_write_prefetches_before);
4467         }
4468     }
4469
4470   for (i = 0; i < num_prefetches; i++)
4471     {
4472       int y;
4473
4474       for (y = 0; y < info[i].prefetch_in_loop; y++)
4475         {
4476           rtx loc = copy_rtx (*info[i].giv->location);
4477           rtx insn;
4478           int bytes_ahead = PREFETCH_BLOCK * (ahead + y);
4479           rtx before_insn = info[i].giv->insn;
4480           rtx prev_insn = PREV_INSN (info[i].giv->insn);
4481           rtx seq;
4482
4483           /* We can save some effort by offsetting the address on
4484              architectures with offsettable memory references.  */
4485           if (offsettable_address_p (0, VOIDmode, loc))
4486             loc = plus_constant (loc, bytes_ahead);
4487           else
4488             {
4489               rtx reg = gen_reg_rtx (Pmode);
4490               loop_iv_add_mult_emit_before (loop, loc, const1_rtx,
4491                                             GEN_INT (bytes_ahead), reg,
4492                                             0, before_insn);
4493               loc = reg;
4494             }
4495
4496           start_sequence ();
4497           /* Make sure the address operand is valid for prefetch.  */
4498           if (! (*insn_data[(int)CODE_FOR_prefetch].operand[0].predicate)
4499                   (loc, insn_data[(int)CODE_FOR_prefetch].operand[0].mode))
4500             loc = force_reg (Pmode, loc);
4501           emit_insn (gen_prefetch (loc, GEN_INT (info[i].write),
4502                                    GEN_INT (3)));
4503           seq = get_insns ();
4504           end_sequence ();
4505           emit_insn_before (seq, before_insn);
4506
4507           /* Check all insns emitted and record the new GIV
4508              information.  */
4509           insn = NEXT_INSN (prev_insn);
4510           while (insn != before_insn)
4511             {
4512               insn = check_insn_for_givs (loop, insn,
4513                                           info[i].giv->always_executed,
4514                                           info[i].giv->maybe_multiple);
4515               insn = NEXT_INSN (insn);
4516             }
4517         }
4518
4519       if (PREFETCH_BEFORE_LOOP)
4520         {
4521           /* Emit insns before the loop to fetch the first cache lines or,
4522              if we're not prefetching within the loop, everything we expect
4523              to need.  */
4524           for (y = 0; y < info[i].prefetch_before_loop; y++)
4525             {
4526               rtx reg = gen_reg_rtx (Pmode);
4527               rtx loop_start = loop->start;
4528               rtx init_val = info[i].class->initial_value;
4529               rtx add_val = simplify_gen_binary (PLUS, Pmode,
4530                                                  info[i].giv->add_val,
4531                                                  GEN_INT (y * PREFETCH_BLOCK));
4532
4533               /* Functions called by LOOP_IV_ADD_EMIT_BEFORE expect a
4534                  non-constant INIT_VAL to have the same mode as REG, which
4535                  in this case we know to be Pmode.  */
4536               if (GET_MODE (init_val) != Pmode && !CONSTANT_P (init_val))
4537                 {
4538                   rtx seq;
4539
4540                   start_sequence ();
4541                   init_val = convert_to_mode (Pmode, init_val, 0);
4542                   seq = get_insns ();
4543                   end_sequence ();
4544                   loop_insn_emit_before (loop, 0, loop_start, seq);
4545                 }
4546               loop_iv_add_mult_emit_before (loop, init_val,
4547                                             info[i].giv->mult_val,
4548                                             add_val, reg, 0, loop_start);
4549               emit_insn_before (gen_prefetch (reg, GEN_INT (info[i].write),
4550                                               GEN_INT (3)),
4551                                 loop_start);
4552             }
4553         }
4554     }
4555
4556   return;
4557 }
4558 \f
4559 /* Communication with routines called via `note_stores'.  */
4560
4561 static rtx note_insn;
4562
4563 /* Dummy register to have nonzero DEST_REG for DEST_ADDR type givs.  */
4564
4565 static rtx addr_placeholder;
4566
4567 /* ??? Unfinished optimizations, and possible future optimizations,
4568    for the strength reduction code.  */
4569
4570 /* ??? The interaction of biv elimination, and recognition of 'constant'
4571    bivs, may cause problems.  */
4572
4573 /* ??? Add heuristics so that DEST_ADDR strength reduction does not cause
4574    performance problems.
4575
4576    Perhaps don't eliminate things that can be combined with an addressing
4577    mode.  Find all givs that have the same biv, mult_val, and add_val;
4578    then for each giv, check to see if its only use dies in a following
4579    memory address.  If so, generate a new memory address and check to see
4580    if it is valid.   If it is valid, then store the modified memory address,
4581    otherwise, mark the giv as not done so that it will get its own iv.  */
4582
4583 /* ??? Could try to optimize branches when it is known that a biv is always
4584    positive.  */
4585
4586 /* ??? When replace a biv in a compare insn, we should replace with closest
4587    giv so that an optimized branch can still be recognized by the combiner,
4588    e.g. the VAX acb insn.  */
4589
4590 /* ??? Many of the checks involving uid_luid could be simplified if regscan
4591    was rerun in loop_optimize whenever a register was added or moved.
4592    Also, some of the optimizations could be a little less conservative.  */
4593 \f
4594 /* Searches the insns between INSN and LOOP->END.  Returns 1 if there
4595    is a backward branch in that range that branches to somewhere between
4596    LOOP->START and INSN.  Returns 0 otherwise.  */
4597
4598 /* ??? This is quadratic algorithm.  Could be rewritten to be linear.
4599    In practice, this is not a problem, because this function is seldom called,
4600    and uses a negligible amount of CPU time on average.  */
4601
4602 static int
4603 back_branch_in_range_p (const struct loop *loop, rtx insn)
4604 {
4605   rtx p, q, target_insn;
4606   rtx loop_start = loop->start;
4607   rtx loop_end = loop->end;
4608   rtx orig_loop_end = loop->end;
4609
4610   /* Stop before we get to the backward branch at the end of the loop.  */
4611   loop_end = prev_nonnote_insn (loop_end);
4612   if (BARRIER_P (loop_end))
4613     loop_end = PREV_INSN (loop_end);
4614
4615   /* Check in case insn has been deleted, search forward for first non
4616      deleted insn following it.  */
4617   while (INSN_DELETED_P (insn))
4618     insn = NEXT_INSN (insn);
4619
4620   /* Check for the case where insn is the last insn in the loop.  Deal
4621      with the case where INSN was a deleted loop test insn, in which case
4622      it will now be the NOTE_LOOP_END.  */
4623   if (insn == loop_end || insn == orig_loop_end)
4624     return 0;
4625
4626   for (p = NEXT_INSN (insn); p != loop_end; p = NEXT_INSN (p))
4627     {
4628       if (JUMP_P (p))
4629         {
4630           target_insn = JUMP_LABEL (p);
4631
4632           /* Search from loop_start to insn, to see if one of them is
4633              the target_insn.  We can't use INSN_LUID comparisons here,
4634              since insn may not have an LUID entry.  */
4635           for (q = loop_start; q != insn; q = NEXT_INSN (q))
4636             if (q == target_insn)
4637               return 1;
4638         }
4639     }
4640
4641   return 0;
4642 }
4643
4644 /* Scan the loop body and call FNCALL for each insn.  In the addition to the
4645    LOOP and INSN parameters pass MAYBE_MULTIPLE and NOT_EVERY_ITERATION to the
4646    callback.
4647
4648    NOT_EVERY_ITERATION is 1 if current insn is not known to be executed at
4649    least once for every loop iteration except for the last one.
4650
4651    MAYBE_MULTIPLE is 1 if current insn may be executed more than once for every
4652    loop iteration.
4653  */
4654 typedef rtx (*loop_insn_callback) (struct loop *, rtx, int, int);
4655 static void
4656 for_each_insn_in_loop (struct loop *loop, loop_insn_callback fncall)
4657 {
4658   int not_every_iteration = 0;
4659   int maybe_multiple = 0;
4660   int past_loop_latch = 0;
4661   bool exit_test_is_entry = false;
4662   rtx p;
4663
4664   /* If loop_scan_start points to the loop exit test, the loop body
4665      cannot be counted on running on every iteration, and we have to
4666      be wary of subversive use of gotos inside expression
4667      statements.  */
4668   if (prev_nonnote_insn (loop->scan_start) != prev_nonnote_insn (loop->start))
4669     {
4670       exit_test_is_entry = true;
4671       maybe_multiple = back_branch_in_range_p (loop, loop->scan_start);
4672     }
4673
4674   /* Scan through loop and update NOT_EVERY_ITERATION and MAYBE_MULTIPLE.  */
4675   for (p = next_insn_in_loop (loop, loop->scan_start);
4676        p != NULL_RTX;
4677        p = next_insn_in_loop (loop, p))
4678     {
4679       p = fncall (loop, p, not_every_iteration, maybe_multiple);
4680
4681       /* Past CODE_LABEL, we get to insns that may be executed multiple
4682          times.  The only way we can be sure that they can't is if every
4683          jump insn between here and the end of the loop either
4684          returns, exits the loop, is a jump to a location that is still
4685          behind the label, or is a jump to the loop start.  */
4686
4687       if (LABEL_P (p))
4688         {
4689           rtx insn = p;
4690
4691           maybe_multiple = 0;
4692
4693           while (1)
4694             {
4695               insn = NEXT_INSN (insn);
4696               if (insn == loop->scan_start)
4697                 break;
4698               if (insn == loop->end)
4699                 {
4700                   if (loop->top != 0)
4701                     insn = loop->top;
4702                   else
4703                     break;
4704                   if (insn == loop->scan_start)
4705                     break;
4706                 }
4707
4708               if (JUMP_P (insn)
4709                   && GET_CODE (PATTERN (insn)) != RETURN
4710                   && (!any_condjump_p (insn)
4711                       || (JUMP_LABEL (insn) != 0
4712                           && JUMP_LABEL (insn) != loop->scan_start
4713                           && !loop_insn_first_p (p, JUMP_LABEL (insn)))))
4714                 {
4715                   maybe_multiple = 1;
4716                   break;
4717                 }
4718             }
4719         }
4720
4721       /* Past a jump, we get to insns for which we can't count
4722          on whether they will be executed during each iteration.  */
4723       /* This code appears twice in strength_reduce.  There is also similar
4724          code in scan_loop.  */
4725       if (JUMP_P (p)
4726       /* If we enter the loop in the middle, and scan around to the
4727          beginning, don't set not_every_iteration for that.
4728          This can be any kind of jump, since we want to know if insns
4729          will be executed if the loop is executed.  */
4730           && (exit_test_is_entry
4731               || !(JUMP_LABEL (p) == loop->top
4732                    && ((NEXT_INSN (NEXT_INSN (p)) == loop->end
4733                         && any_uncondjump_p (p))
4734                        || (NEXT_INSN (p) == loop->end
4735                            && any_condjump_p (p))))))
4736         {
4737           rtx label = 0;
4738
4739           /* If this is a jump outside the loop, then it also doesn't
4740              matter.  Check to see if the target of this branch is on the
4741              loop->exits_labels list.  */
4742
4743           for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
4744             if (XEXP (label, 0) == JUMP_LABEL (p))
4745               break;
4746
4747           if (!label)
4748             not_every_iteration = 1;
4749         }
4750
4751       /* Note if we pass a loop latch.  If we do, then we can not clear
4752          NOT_EVERY_ITERATION below when we pass the last CODE_LABEL in
4753          a loop since a jump before the last CODE_LABEL may have started
4754          a new loop iteration.
4755
4756          Note that LOOP_TOP is only set for rotated loops and we need
4757          this check for all loops, so compare against the CODE_LABEL
4758          which immediately follows LOOP_START.  */
4759       if (JUMP_P (p)
4760           && JUMP_LABEL (p) == NEXT_INSN (loop->start))
4761         past_loop_latch = 1;
4762
4763       /* Unlike in the code motion pass where MAYBE_NEVER indicates that
4764          an insn may never be executed, NOT_EVERY_ITERATION indicates whether
4765          or not an insn is known to be executed each iteration of the
4766          loop, whether or not any iterations are known to occur.
4767
4768          Therefore, if we have just passed a label and have no more labels
4769          between here and the test insn of the loop, and we have not passed
4770          a jump to the top of the loop, then we know these insns will be
4771          executed each iteration.  */
4772
4773       if (not_every_iteration
4774           && !past_loop_latch
4775           && LABEL_P (p)
4776           && no_labels_between_p (p, loop->end))
4777         not_every_iteration = 0;
4778     }
4779 }
4780 \f
4781 static void
4782 loop_bivs_find (struct loop *loop)
4783 {
4784   struct loop_regs *regs = LOOP_REGS (loop);
4785   struct loop_ivs *ivs = LOOP_IVS (loop);
4786   /* Temporary list pointers for traversing ivs->list.  */
4787   struct iv_class *bl, **backbl;
4788
4789   ivs->list = 0;
4790
4791   for_each_insn_in_loop (loop, check_insn_for_bivs);
4792
4793   /* Scan ivs->list to remove all regs that proved not to be bivs.
4794      Make a sanity check against regs->n_times_set.  */
4795   for (backbl = &ivs->list, bl = *backbl; bl; bl = bl->next)
4796     {
4797       if (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4798           /* Above happens if register modified by subreg, etc.  */
4799           /* Make sure it is not recognized as a basic induction var: */
4800           || regs->array[bl->regno].n_times_set != bl->biv_count
4801           /* If never incremented, it is invariant that we decided not to
4802              move.  So leave it alone.  */
4803           || ! bl->incremented)
4804         {
4805           if (loop_dump_stream)
4806             fprintf (loop_dump_stream, "Biv %d: discarded, %s\n",
4807                      bl->regno,
4808                      (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4809                       ? "not induction variable"
4810                       : (! bl->incremented ? "never incremented"
4811                          : "count error")));
4812
4813           REG_IV_TYPE (ivs, bl->regno) = NOT_BASIC_INDUCT;
4814           *backbl = bl->next;
4815         }
4816       else
4817         {
4818           backbl = &bl->next;
4819
4820           if (loop_dump_stream)
4821             fprintf (loop_dump_stream, "Biv %d: verified\n", bl->regno);
4822         }
4823     }
4824 }
4825
4826
4827 /* Determine how BIVS are initialized by looking through pre-header
4828    extended basic block.  */
4829 static void
4830 loop_bivs_init_find (struct loop *loop)
4831 {
4832   struct loop_ivs *ivs = LOOP_IVS (loop);
4833   /* Temporary list pointers for traversing ivs->list.  */
4834   struct iv_class *bl;
4835   int call_seen;
4836   rtx p;
4837
4838   /* Find initial value for each biv by searching backwards from loop_start,
4839      halting at first label.  Also record any test condition.  */
4840
4841   call_seen = 0;
4842   for (p = loop->start; p && !LABEL_P (p); p = PREV_INSN (p))
4843     {
4844       rtx test;
4845
4846       note_insn = p;
4847
4848       if (CALL_P (p))
4849         call_seen = 1;
4850
4851       if (INSN_P (p))
4852         note_stores (PATTERN (p), record_initial, ivs);
4853
4854       /* Record any test of a biv that branches around the loop if no store
4855          between it and the start of loop.  We only care about tests with
4856          constants and registers and only certain of those.  */
4857       if (JUMP_P (p)
4858           && JUMP_LABEL (p) != 0
4859           && next_real_insn (JUMP_LABEL (p)) == next_real_insn (loop->end)
4860           && (test = get_condition_for_loop (loop, p)) != 0
4861           && REG_P (XEXP (test, 0))
4862           && REGNO (XEXP (test, 0)) < max_reg_before_loop
4863           && (bl = REG_IV_CLASS (ivs, REGNO (XEXP (test, 0)))) != 0
4864           && valid_initial_value_p (XEXP (test, 1), p, call_seen, loop->start)
4865           && bl->init_insn == 0)
4866         {
4867           /* If an NE test, we have an initial value!  */
4868           if (GET_CODE (test) == NE)
4869             {
4870               bl->init_insn = p;
4871               bl->init_set = gen_rtx_SET (VOIDmode,
4872                                           XEXP (test, 0), XEXP (test, 1));
4873             }
4874           else
4875             bl->initial_test = test;
4876         }
4877     }
4878 }
4879
4880
4881 /* Look at the each biv and see if we can say anything better about its
4882    initial value from any initializing insns set up above.  (This is done
4883    in two passes to avoid missing SETs in a PARALLEL.)  */
4884 static void
4885 loop_bivs_check (struct loop *loop)
4886 {
4887   struct loop_ivs *ivs = LOOP_IVS (loop);
4888   /* Temporary list pointers for traversing ivs->list.  */
4889   struct iv_class *bl;
4890   struct iv_class **backbl;
4891
4892   for (backbl = &ivs->list; (bl = *backbl); backbl = &bl->next)
4893     {
4894       rtx src;
4895       rtx note;
4896
4897       if (! bl->init_insn)
4898         continue;
4899
4900       /* IF INIT_INSN has a REG_EQUAL or REG_EQUIV note and the value
4901          is a constant, use the value of that.  */
4902       if (((note = find_reg_note (bl->init_insn, REG_EQUAL, 0)) != NULL
4903            && CONSTANT_P (XEXP (note, 0)))
4904           || ((note = find_reg_note (bl->init_insn, REG_EQUIV, 0)) != NULL
4905               && CONSTANT_P (XEXP (note, 0))))
4906         src = XEXP (note, 0);
4907       else
4908         src = SET_SRC (bl->init_set);
4909
4910       if (loop_dump_stream)
4911         fprintf (loop_dump_stream,
4912                  "Biv %d: initialized at insn %d: initial value ",
4913                  bl->regno, INSN_UID (bl->init_insn));
4914
4915       if ((GET_MODE (src) == GET_MODE (regno_reg_rtx[bl->regno])
4916            || GET_MODE (src) == VOIDmode)
4917           && valid_initial_value_p (src, bl->init_insn,
4918                                     LOOP_INFO (loop)->pre_header_has_call,
4919                                     loop->start))
4920         {
4921           bl->initial_value = src;
4922
4923           if (loop_dump_stream)
4924             {
4925               print_simple_rtl (loop_dump_stream, src);
4926               fputc ('\n', loop_dump_stream);
4927             }
4928         }
4929       /* If we can't make it a giv,
4930          let biv keep initial value of "itself".  */
4931       else if (loop_dump_stream)
4932         fprintf (loop_dump_stream, "is complex\n");
4933     }
4934 }
4935
4936
4937 /* Search the loop for general induction variables.  */
4938
4939 static void
4940 loop_givs_find (struct loop* loop)
4941 {
4942   for_each_insn_in_loop (loop, check_insn_for_givs);
4943 }
4944
4945
4946 /* For each giv for which we still don't know whether or not it is
4947    replaceable, check to see if it is replaceable because its final value
4948    can be calculated.  */
4949
4950 static void
4951 loop_givs_check (struct loop *loop)
4952 {
4953   struct loop_ivs *ivs = LOOP_IVS (loop);
4954   struct iv_class *bl;
4955
4956   for (bl = ivs->list; bl; bl = bl->next)
4957     {
4958       struct induction *v;
4959
4960       for (v = bl->giv; v; v = v->next_iv)
4961         if (! v->replaceable && ! v->not_replaceable)
4962           check_final_value (loop, v);
4963     }
4964 }
4965
4966 /* Try to generate the simplest rtx for the expression
4967    (PLUS (MULT mult1 mult2) add1).  This is used to calculate the initial
4968    value of giv's.  */
4969
4970 static rtx
4971 fold_rtx_mult_add (rtx mult1, rtx mult2, rtx add1, enum machine_mode mode)
4972 {
4973   rtx temp, mult_res;
4974   rtx result;
4975
4976   /* The modes must all be the same.  This should always be true.  For now,
4977      check to make sure.  */
4978   gcc_assert (GET_MODE (mult1) == mode || GET_MODE (mult1) == VOIDmode);
4979   gcc_assert (GET_MODE (mult2) == mode || GET_MODE (mult2) == VOIDmode);
4980   gcc_assert (GET_MODE (add1) == mode || GET_MODE (add1) == VOIDmode);
4981
4982   /* Ensure that if at least one of mult1/mult2 are constant, then mult2
4983      will be a constant.  */
4984   if (GET_CODE (mult1) == CONST_INT)
4985     {
4986       temp = mult2;
4987       mult2 = mult1;
4988       mult1 = temp;
4989     }
4990
4991   mult_res = simplify_binary_operation (MULT, mode, mult1, mult2);
4992   if (! mult_res)
4993     mult_res = gen_rtx_MULT (mode, mult1, mult2);
4994
4995   /* Again, put the constant second.  */
4996   if (GET_CODE (add1) == CONST_INT)
4997     {
4998       temp = add1;
4999       add1 = mult_res;
5000       mult_res = temp;
5001     }
5002
5003   result = simplify_binary_operation (PLUS, mode, add1, mult_res);
5004   if (! result)
5005     result = gen_rtx_PLUS (mode, add1, mult_res);
5006
5007   return result;
5008 }
5009
5010 /* Searches the list of induction struct's for the biv BL, to try to calculate
5011    the total increment value for one iteration of the loop as a constant.
5012
5013    Returns the increment value as an rtx, simplified as much as possible,
5014    if it can be calculated.  Otherwise, returns 0.  */
5015
5016 static rtx
5017 biv_total_increment (const struct iv_class *bl)
5018 {
5019   struct induction *v;
5020   rtx result;
5021
5022   /* For increment, must check every instruction that sets it.  Each
5023      instruction must be executed only once each time through the loop.
5024      To verify this, we check that the insn is always executed, and that
5025      there are no backward branches after the insn that branch to before it.
5026      Also, the insn must have a mult_val of one (to make sure it really is
5027      an increment).  */
5028
5029   result = const0_rtx;
5030   for (v = bl->biv; v; v = v->next_iv)
5031     {
5032       if (v->always_computable && v->mult_val == const1_rtx
5033           && ! v->maybe_multiple
5034           && SCALAR_INT_MODE_P (v->mode))
5035         {
5036           /* If we have already counted it, skip it.  */
5037           if (v->same)
5038             continue;
5039
5040           result = fold_rtx_mult_add (result, const1_rtx, v->add_val, v->mode);
5041         }
5042       else
5043         return 0;
5044     }
5045
5046   return result;
5047 }
5048
5049 /* Try to prove that the register is dead after the loop exits.  Trace every
5050    loop exit looking for an insn that will always be executed, which sets
5051    the register to some value, and appears before the first use of the register
5052    is found.  If successful, then return 1, otherwise return 0.  */
5053
5054 /* ?? Could be made more intelligent in the handling of jumps, so that
5055    it can search past if statements and other similar structures.  */
5056
5057 static int
5058 reg_dead_after_loop (const struct loop *loop, rtx reg)
5059 {
5060   rtx insn, label;
5061   int jump_count = 0;
5062   int label_count = 0;
5063
5064   /* In addition to checking all exits of this loop, we must also check
5065      all exits of inner nested loops that would exit this loop.  We don't
5066      have any way to identify those, so we just give up if there are any
5067      such inner loop exits.  */
5068
5069   for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
5070     label_count++;
5071
5072   if (label_count != loop->exit_count)
5073     return 0;
5074
5075   /* HACK: Must also search the loop fall through exit, create a label_ref
5076      here which points to the loop->end, and append the loop_number_exit_labels
5077      list to it.  */
5078   label = gen_rtx_LABEL_REF (Pmode, loop->end);
5079   LABEL_NEXTREF (label) = loop->exit_labels;
5080
5081   for (; label; label = LABEL_NEXTREF (label))
5082     {
5083       /* Succeed if find an insn which sets the biv or if reach end of
5084          function.  Fail if find an insn that uses the biv, or if come to
5085          a conditional jump.  */
5086
5087       insn = NEXT_INSN (XEXP (label, 0));
5088       while (insn)
5089         {
5090           if (INSN_P (insn))
5091             {
5092               rtx set, note;
5093
5094               if (reg_referenced_p (reg, PATTERN (insn)))
5095                 return 0;
5096
5097               note = find_reg_equal_equiv_note (insn);
5098               if (note && reg_overlap_mentioned_p (reg, XEXP (note, 0)))
5099                 return 0;
5100
5101               set = single_set (insn);
5102               if (set && rtx_equal_p (SET_DEST (set), reg))
5103                 break;
5104
5105               if (JUMP_P (insn))
5106                 {
5107                   if (GET_CODE (PATTERN (insn)) == RETURN)
5108                     break;
5109                   else if (!any_uncondjump_p (insn)
5110                            /* Prevent infinite loop following infinite loops.  */
5111                            || jump_count++ > 20)
5112                     return 0;
5113                   else
5114                     insn = JUMP_LABEL (insn);
5115                 }
5116             }
5117
5118           insn = NEXT_INSN (insn);
5119         }
5120     }
5121
5122   /* Success, the register is dead on all loop exits.  */
5123   return 1;
5124 }
5125
5126 /* Try to calculate the final value of the biv, the value it will have at
5127    the end of the loop.  If we can do it, return that value.  */
5128
5129 static rtx
5130 final_biv_value (const struct loop *loop, struct iv_class *bl)
5131 {
5132   unsigned HOST_WIDE_INT n_iterations = LOOP_INFO (loop)->n_iterations;
5133   rtx increment, tem;
5134
5135   /* ??? This only works for MODE_INT biv's.  Reject all others for now.  */
5136
5137   if (GET_MODE_CLASS (bl->biv->mode) != MODE_INT)
5138     return 0;
5139
5140   /* The final value for reversed bivs must be calculated differently than
5141      for ordinary bivs.  In this case, there is already an insn after the
5142      loop which sets this biv's final value (if necessary), and there are
5143      no other loop exits, so we can return any value.  */
5144   if (bl->reversed)
5145     {
5146       if (loop_dump_stream)
5147         fprintf (loop_dump_stream,
5148                  "Final biv value for %d, reversed biv.\n", bl->regno);
5149
5150       return const0_rtx;
5151     }
5152
5153   /* Try to calculate the final value as initial value + (number of iterations
5154      * increment).  For this to work, increment must be invariant, the only
5155      exit from the loop must be the fall through at the bottom (otherwise
5156      it may not have its final value when the loop exits), and the initial
5157      value of the biv must be invariant.  */
5158
5159   if (n_iterations != 0
5160       && ! loop->exit_count
5161       && loop_invariant_p (loop, bl->initial_value))
5162     {
5163       increment = biv_total_increment (bl);
5164
5165       if (increment && loop_invariant_p (loop, increment))
5166         {
5167           /* Can calculate the loop exit value, emit insns after loop
5168              end to calculate this value into a temporary register in
5169              case it is needed later.  */
5170
5171           tem = gen_reg_rtx (bl->biv->mode);
5172           record_base_value (REGNO (tem), bl->biv->add_val, 0);
5173           loop_iv_add_mult_sink (loop, increment, GEN_INT (n_iterations),
5174                                  bl->initial_value, tem);
5175
5176           if (loop_dump_stream)
5177             fprintf (loop_dump_stream,
5178                      "Final biv value for %d, calculated.\n", bl->regno);
5179
5180           return tem;
5181         }
5182     }
5183
5184   /* Check to see if the biv is dead at all loop exits.  */
5185   if (reg_dead_after_loop (loop, bl->biv->src_reg))
5186     {
5187       if (loop_dump_stream)
5188         fprintf (loop_dump_stream,
5189                  "Final biv value for %d, biv dead after loop exit.\n",
5190                  bl->regno);
5191
5192       return const0_rtx;
5193     }
5194
5195   return 0;
5196 }
5197
5198 /* Return nonzero if it is possible to eliminate the biv BL provided
5199    all givs are reduced.  This is possible if either the reg is not
5200    used outside the loop, or we can compute what its final value will
5201    be.  */
5202
5203 static int
5204 loop_biv_eliminable_p (struct loop *loop, struct iv_class *bl,
5205                        int threshold, int insn_count)
5206 {
5207   /* For architectures with a decrement_and_branch_until_zero insn,
5208      don't do this if we put a REG_NONNEG note on the endtest for this
5209      biv.  */
5210
5211 #ifdef HAVE_decrement_and_branch_until_zero
5212   if (bl->nonneg)
5213     {
5214       if (loop_dump_stream)
5215         fprintf (loop_dump_stream,
5216                  "Cannot eliminate nonneg biv %d.\n", bl->regno);
5217       return 0;
5218     }
5219 #endif
5220
5221   /* Check that biv is used outside loop or if it has a final value.
5222      Compare against bl->init_insn rather than loop->start.  We aren't
5223      concerned with any uses of the biv between init_insn and
5224      loop->start since these won't be affected by the value of the biv
5225      elsewhere in the function, so long as init_insn doesn't use the
5226      biv itself.  */
5227
5228   if ((REGNO_LAST_LUID (bl->regno) < INSN_LUID (loop->end)
5229        && bl->init_insn
5230        && INSN_UID (bl->init_insn) < max_uid_for_loop
5231        && REGNO_FIRST_LUID (bl->regno) >= INSN_LUID (bl->init_insn)
5232        && ! reg_mentioned_p (bl->biv->dest_reg, SET_SRC (bl->init_set)))
5233       || (bl->final_value = final_biv_value (loop, bl)))
5234     return maybe_eliminate_biv (loop, bl, 0, threshold, insn_count);
5235
5236   if (loop_dump_stream)
5237     {
5238       fprintf (loop_dump_stream,
5239                "Cannot eliminate biv %d.\n",
5240                bl->regno);
5241       fprintf (loop_dump_stream,
5242                "First use: insn %d, last use: insn %d.\n",
5243                REGNO_FIRST_UID (bl->regno),
5244                REGNO_LAST_UID (bl->regno));
5245     }
5246   return 0;
5247 }
5248
5249
5250 /* Reduce each giv of BL that we have decided to reduce.  */
5251
5252 static void
5253 loop_givs_reduce (struct loop *loop, struct iv_class *bl)
5254 {
5255   struct induction *v;
5256
5257   for (v = bl->giv; v; v = v->next_iv)
5258     {
5259       struct induction *tv;
5260       if (! v->ignore && v->same == 0)
5261         {
5262           int auto_inc_opt = 0;
5263
5264           /* If the code for derived givs immediately below has already
5265              allocated a new_reg, we must keep it.  */
5266           if (! v->new_reg)
5267             v->new_reg = gen_reg_rtx (v->mode);
5268
5269 #ifdef AUTO_INC_DEC
5270           /* If the target has auto-increment addressing modes, and
5271              this is an address giv, then try to put the increment
5272              immediately after its use, so that flow can create an
5273              auto-increment addressing mode.  */
5274           /* Don't do this for loops entered at the bottom, to avoid
5275              this invalid transformation:
5276                 jmp L;          ->          jmp L;
5277              TOP:                       TOP:
5278                 use giv                     use giv
5279              L:                             inc giv
5280                 inc biv                 L:
5281                 test biv                    test giv
5282                 cbr TOP                     cbr TOP
5283           */
5284           if (v->giv_type == DEST_ADDR && bl->biv_count == 1
5285               && bl->biv->always_executed && ! bl->biv->maybe_multiple
5286               /* We don't handle reversed biv's because bl->biv->insn
5287                  does not have a valid INSN_LUID.  */
5288               && ! bl->reversed
5289               && v->always_executed && ! v->maybe_multiple
5290               && INSN_UID (v->insn) < max_uid_for_loop
5291               && !loop->top)
5292             {
5293               /* If other giv's have been combined with this one, then
5294                  this will work only if all uses of the other giv's occur
5295                  before this giv's insn.  This is difficult to check.
5296
5297                  We simplify this by looking for the common case where
5298                  there is one DEST_REG giv, and this giv's insn is the
5299                  last use of the dest_reg of that DEST_REG giv.  If the
5300                  increment occurs after the address giv, then we can
5301                  perform the optimization.  (Otherwise, the increment
5302                  would have to go before other_giv, and we would not be
5303                  able to combine it with the address giv to get an
5304                  auto-inc address.)  */
5305               if (v->combined_with)
5306                 {
5307                   struct induction *other_giv = 0;
5308
5309                   for (tv = bl->giv; tv; tv = tv->next_iv)
5310                     if (tv->same == v)
5311                       {
5312                         if (other_giv)
5313                           break;
5314                         else
5315                           other_giv = tv;
5316                       }
5317                   if (! tv && other_giv
5318                       && REGNO (other_giv->dest_reg) < max_reg_before_loop
5319                       && (REGNO_LAST_UID (REGNO (other_giv->dest_reg))
5320                           == INSN_UID (v->insn))
5321                       && INSN_LUID (v->insn) < INSN_LUID (bl->biv->insn))
5322                     auto_inc_opt = 1;
5323                 }
5324               /* Check for case where increment is before the address
5325                  giv.  Do this test in "loop order".  */
5326               else if ((INSN_LUID (v->insn) > INSN_LUID (bl->biv->insn)
5327                         && (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
5328                             || (INSN_LUID (bl->biv->insn)
5329                                 > INSN_LUID (loop->scan_start))))
5330                        || (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
5331                            && (INSN_LUID (loop->scan_start)
5332                                < INSN_LUID (bl->biv->insn))))
5333                 auto_inc_opt = -1;
5334               else
5335                 auto_inc_opt = 1;
5336
5337 #ifdef HAVE_cc0
5338               {
5339                 rtx prev;
5340
5341                 /* We can't put an insn immediately after one setting
5342                    cc0, or immediately before one using cc0.  */
5343                 if ((auto_inc_opt == 1 && sets_cc0_p (PATTERN (v->insn)))
5344                     || (auto_inc_opt == -1
5345                         && (prev = prev_nonnote_insn (v->insn)) != 0
5346                         && INSN_P (prev)
5347                         && sets_cc0_p (PATTERN (prev))))
5348                   auto_inc_opt = 0;
5349               }
5350 #endif
5351
5352               if (auto_inc_opt)
5353                 v->auto_inc_opt = 1;
5354             }
5355 #endif
5356
5357           /* For each place where the biv is incremented, add an insn
5358              to increment the new, reduced reg for the giv.  */
5359           for (tv = bl->biv; tv; tv = tv->next_iv)
5360             {
5361               rtx insert_before;
5362
5363               /* Skip if location is the same as a previous one.  */
5364               if (tv->same)
5365                 continue;
5366               if (! auto_inc_opt)
5367                 insert_before = NEXT_INSN (tv->insn);
5368               else if (auto_inc_opt == 1)
5369                 insert_before = NEXT_INSN (v->insn);
5370               else
5371                 insert_before = v->insn;
5372
5373               if (tv->mult_val == const1_rtx)
5374                 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
5375                                               v->new_reg, v->new_reg,
5376                                               0, insert_before);
5377               else /* tv->mult_val == const0_rtx */
5378                 /* A multiply is acceptable here
5379                    since this is presumed to be seldom executed.  */
5380                 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
5381                                               v->add_val, v->new_reg,
5382                                               0, insert_before);
5383             }
5384
5385           /* Add code at loop start to initialize giv's reduced reg.  */
5386
5387           loop_iv_add_mult_hoist (loop,
5388                                   extend_value_for_giv (v, bl->initial_value),
5389                                   v->mult_val, v->add_val, v->new_reg);
5390         }
5391     }
5392 }
5393
5394
5395 /* Check for givs whose first use is their definition and whose
5396    last use is the definition of another giv.  If so, it is likely
5397    dead and should not be used to derive another giv nor to
5398    eliminate a biv.  */
5399
5400 static void
5401 loop_givs_dead_check (struct loop *loop ATTRIBUTE_UNUSED, struct iv_class *bl)
5402 {
5403   struct induction *v;
5404
5405   for (v = bl->giv; v; v = v->next_iv)
5406     {
5407       if (v->ignore
5408           || (v->same && v->same->ignore))
5409         continue;
5410
5411       if (v->giv_type == DEST_REG
5412           && REGNO_FIRST_UID (REGNO (v->dest_reg)) == INSN_UID (v->insn))
5413         {
5414           struct induction *v1;
5415
5416           for (v1 = bl->giv; v1; v1 = v1->next_iv)
5417             if (REGNO_LAST_UID (REGNO (v->dest_reg)) == INSN_UID (v1->insn))
5418               v->maybe_dead = 1;
5419         }
5420     }
5421 }
5422
5423
5424 static void
5425 loop_givs_rescan (struct loop *loop, struct iv_class *bl, rtx *reg_map)
5426 {
5427   struct induction *v;
5428
5429   for (v = bl->giv; v; v = v->next_iv)
5430     {
5431       if (v->same && v->same->ignore)
5432         v->ignore = 1;
5433
5434       if (v->ignore)
5435         continue;
5436
5437       /* Update expression if this was combined, in case other giv was
5438          replaced.  */
5439       if (v->same)
5440         v->new_reg = replace_rtx (v->new_reg,
5441                                   v->same->dest_reg, v->same->new_reg);
5442
5443       /* See if this register is known to be a pointer to something.  If
5444          so, see if we can find the alignment.  First see if there is a
5445          destination register that is a pointer.  If so, this shares the
5446          alignment too.  Next see if we can deduce anything from the
5447          computational information.  If not, and this is a DEST_ADDR
5448          giv, at least we know that it's a pointer, though we don't know
5449          the alignment.  */
5450       if (REG_P (v->new_reg)
5451           && v->giv_type == DEST_REG
5452           && REG_POINTER (v->dest_reg))
5453         mark_reg_pointer (v->new_reg,
5454                           REGNO_POINTER_ALIGN (REGNO (v->dest_reg)));
5455       else if (REG_P (v->new_reg)
5456                && REG_POINTER (v->src_reg))
5457         {
5458           unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->src_reg));
5459
5460           if (align == 0
5461               || GET_CODE (v->add_val) != CONST_INT
5462               || INTVAL (v->add_val) % (align / BITS_PER_UNIT) != 0)
5463             align = 0;
5464
5465           mark_reg_pointer (v->new_reg, align);
5466         }
5467       else if (REG_P (v->new_reg)
5468                && REG_P (v->add_val)
5469                && REG_POINTER (v->add_val))
5470         {
5471           unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->add_val));
5472
5473           if (align == 0 || GET_CODE (v->mult_val) != CONST_INT
5474               || INTVAL (v->mult_val) % (align / BITS_PER_UNIT) != 0)
5475             align = 0;
5476
5477           mark_reg_pointer (v->new_reg, align);
5478         }
5479       else if (REG_P (v->new_reg) && v->giv_type == DEST_ADDR)
5480         mark_reg_pointer (v->new_reg, 0);
5481
5482       if (v->giv_type == DEST_ADDR)
5483         {
5484           /* Store reduced reg as the address in the memref where we found
5485              this giv.  */
5486           if (validate_change_maybe_volatile (v->insn, v->location,
5487                                               v->new_reg))
5488             /* Yay, it worked!  */;
5489           /* Not replaceable; emit an insn to set the original
5490              giv reg from the reduced giv.  */
5491           else if (REG_P (*v->location))
5492             loop_insn_emit_before (loop, 0, v->insn,
5493                                    gen_move_insn (*v->location,
5494                                                   v->new_reg));
5495           else if (GET_CODE (*v->location) == PLUS
5496                    && REG_P (XEXP (*v->location, 0))
5497                    && CONSTANT_P (XEXP (*v->location, 1)))
5498             loop_insn_emit_before (loop, 0, v->insn,
5499                                    gen_move_insn (XEXP (*v->location, 0),
5500                                                   gen_rtx_MINUS
5501                                                   (GET_MODE (*v->location),
5502                                                    v->new_reg,
5503                                                    XEXP (*v->location, 1))));
5504           else
5505             {
5506               /* If it wasn't a reg, create a pseudo and use that.  */
5507               rtx reg, seq;
5508               start_sequence ();
5509               reg = force_reg (v->mode, *v->location);
5510               seq = get_insns ();
5511               end_sequence ();
5512               loop_insn_emit_before (loop, 0, v->insn, seq);
5513               if (!validate_change_maybe_volatile (v->insn, v->location, reg))
5514                 gcc_unreachable ();
5515             }
5516         }
5517       else if (v->replaceable)
5518         {
5519           reg_map[REGNO (v->dest_reg)] = v->new_reg;
5520         }
5521       else
5522         {
5523           rtx original_insn = v->insn;
5524           rtx note;
5525
5526           /* Not replaceable; emit an insn to set the original giv reg from
5527              the reduced giv, same as above.  */
5528           v->insn = loop_insn_emit_after (loop, 0, original_insn,
5529                                           gen_move_insn (v->dest_reg,
5530                                                          v->new_reg));
5531
5532           /* The original insn may have a REG_EQUAL note.  This note is
5533              now incorrect and may result in invalid substitutions later.
5534              The original insn is dead, but may be part of a libcall
5535              sequence, which doesn't seem worth the bother of handling.  */
5536           note = find_reg_note (original_insn, REG_EQUAL, NULL_RTX);
5537           if (note)
5538             remove_note (original_insn, note);
5539         }
5540
5541       /* When a loop is reversed, givs which depend on the reversed
5542          biv, and which are live outside the loop, must be set to their
5543          correct final value.  This insn is only needed if the giv is
5544          not replaceable.  The correct final value is the same as the
5545          value that the giv starts the reversed loop with.  */
5546       if (bl->reversed && ! v->replaceable)
5547         loop_iv_add_mult_sink (loop,
5548                                extend_value_for_giv (v, bl->initial_value),
5549                                v->mult_val, v->add_val, v->dest_reg);
5550       else if (v->final_value)
5551         loop_insn_sink_or_swim (loop,
5552                                 gen_load_of_final_value (v->dest_reg,
5553                                                          v->final_value));
5554
5555       if (loop_dump_stream)
5556         {
5557           fprintf (loop_dump_stream, "giv at %d reduced to ",
5558                    INSN_UID (v->insn));
5559           print_simple_rtl (loop_dump_stream, v->new_reg);
5560           fprintf (loop_dump_stream, "\n");
5561         }
5562     }
5563 }
5564
5565
5566 static int
5567 loop_giv_reduce_benefit (struct loop *loop ATTRIBUTE_UNUSED,
5568                          struct iv_class *bl, struct induction *v,
5569                          rtx test_reg)
5570 {
5571   int add_cost;
5572   int benefit;
5573
5574   benefit = v->benefit;
5575   PUT_MODE (test_reg, v->mode);
5576   add_cost = iv_add_mult_cost (bl->biv->add_val, v->mult_val,
5577                                test_reg, test_reg);
5578
5579   /* Reduce benefit if not replaceable, since we will insert a
5580      move-insn to replace the insn that calculates this giv.  Don't do
5581      this unless the giv is a user variable, since it will often be
5582      marked non-replaceable because of the duplication of the exit
5583      code outside the loop.  In such a case, the copies we insert are
5584      dead and will be deleted.  So they don't have a cost.  Similar
5585      situations exist.  */
5586   /* ??? The new final_[bg]iv_value code does a much better job of
5587      finding replaceable giv's, and hence this code may no longer be
5588      necessary.  */
5589   if (! v->replaceable && ! bl->eliminable
5590       && REG_USERVAR_P (v->dest_reg))
5591     benefit -= copy_cost;
5592
5593   /* Decrease the benefit to count the add-insns that we will insert
5594      to increment the reduced reg for the giv.  ??? This can
5595      overestimate the run-time cost of the additional insns, e.g. if
5596      there are multiple basic blocks that increment the biv, but only
5597      one of these blocks is executed during each iteration.  There is
5598      no good way to detect cases like this with the current structure
5599      of the loop optimizer.  This code is more accurate for
5600      determining code size than run-time benefits.  */
5601   benefit -= add_cost * bl->biv_count;
5602
5603   /* Decide whether to strength-reduce this giv or to leave the code
5604      unchanged (recompute it from the biv each time it is used).  This
5605      decision can be made independently for each giv.  */
5606
5607 #ifdef AUTO_INC_DEC
5608   /* Attempt to guess whether autoincrement will handle some of the
5609      new add insns; if so, increase BENEFIT (undo the subtraction of
5610      add_cost that was done above).  */
5611   if (v->giv_type == DEST_ADDR
5612       /* Increasing the benefit is risky, since this is only a guess.
5613          Avoid increasing register pressure in cases where there would
5614          be no other benefit from reducing this giv.  */
5615       && benefit > 0
5616       && GET_CODE (v->mult_val) == CONST_INT)
5617     {
5618       int size = GET_MODE_SIZE (GET_MODE (v->mem));
5619
5620       if (HAVE_POST_INCREMENT
5621           && INTVAL (v->mult_val) == size)
5622         benefit += add_cost * bl->biv_count;
5623       else if (HAVE_PRE_INCREMENT
5624                && INTVAL (v->mult_val) == size)
5625         benefit += add_cost * bl->biv_count;
5626       else if (HAVE_POST_DECREMENT
5627                && -INTVAL (v->mult_val) == size)
5628         benefit += add_cost * bl->biv_count;
5629       else if (HAVE_PRE_DECREMENT
5630                && -INTVAL (v->mult_val) == size)
5631         benefit += add_cost * bl->biv_count;
5632     }
5633 #endif
5634
5635   return benefit;
5636 }
5637
5638
5639 /* Free IV structures for LOOP.  */
5640
5641 static void
5642 loop_ivs_free (struct loop *loop)
5643 {
5644   struct loop_ivs *ivs = LOOP_IVS (loop);
5645   struct iv_class *iv = ivs->list;
5646
5647   free (ivs->regs);
5648
5649   while (iv)
5650     {
5651       struct iv_class *next = iv->next;
5652       struct induction *induction;
5653       struct induction *next_induction;
5654
5655       for (induction = iv->biv; induction; induction = next_induction)
5656         {
5657           next_induction = induction->next_iv;
5658           free (induction);
5659         }
5660       for (induction = iv->giv; induction; induction = next_induction)
5661         {
5662           next_induction = induction->next_iv;
5663           free (induction);
5664         }
5665
5666       free (iv);
5667       iv = next;
5668     }
5669 }
5670
5671 /* Look back before LOOP->START for the insn that sets REG and return
5672    the equivalent constant if there is a REG_EQUAL note otherwise just
5673    the SET_SRC of REG.  */
5674
5675 static rtx
5676 loop_find_equiv_value (const struct loop *loop, rtx reg)
5677 {
5678   rtx loop_start = loop->start;
5679   rtx insn, set;
5680   rtx ret;
5681
5682   ret = reg;
5683   for (insn = PREV_INSN (loop_start); insn; insn = PREV_INSN (insn))
5684     {
5685       if (LABEL_P (insn))
5686         break;
5687
5688       else if (INSN_P (insn) && reg_set_p (reg, insn))
5689         {
5690           /* We found the last insn before the loop that sets the register.
5691              If it sets the entire register, and has a REG_EQUAL note,
5692              then use the value of the REG_EQUAL note.  */
5693           if ((set = single_set (insn))
5694               && (SET_DEST (set) == reg))
5695             {
5696               rtx note = find_reg_note (insn, REG_EQUAL, NULL_RTX);
5697
5698               /* Only use the REG_EQUAL note if it is a constant.
5699                  Other things, divide in particular, will cause
5700                  problems later if we use them.  */
5701               if (note && GET_CODE (XEXP (note, 0)) != EXPR_LIST
5702                   && CONSTANT_P (XEXP (note, 0)))
5703                 ret = XEXP (note, 0);
5704               else
5705                 ret = SET_SRC (set);
5706
5707               /* We cannot do this if it changes between the
5708                  assignment and loop start though.  */
5709               if (modified_between_p (ret, insn, loop_start))
5710                 ret = reg;
5711             }
5712           break;
5713         }
5714     }
5715   return ret;
5716 }
5717
5718 /* Find and return register term common to both expressions OP0 and
5719    OP1 or NULL_RTX if no such term exists.  Each expression must be a
5720    REG or a PLUS of a REG.  */
5721
5722 static rtx
5723 find_common_reg_term (rtx op0, rtx op1)
5724 {
5725   if ((REG_P (op0) || GET_CODE (op0) == PLUS)
5726       && (REG_P (op1) || GET_CODE (op1) == PLUS))
5727     {
5728       rtx op00;
5729       rtx op01;
5730       rtx op10;
5731       rtx op11;
5732
5733       if (GET_CODE (op0) == PLUS)
5734         op01 = XEXP (op0, 1), op00 = XEXP (op0, 0);
5735       else
5736         op01 = const0_rtx, op00 = op0;
5737
5738       if (GET_CODE (op1) == PLUS)
5739         op11 = XEXP (op1, 1), op10 = XEXP (op1, 0);
5740       else
5741         op11 = const0_rtx, op10 = op1;
5742
5743       /* Find and return common register term if present.  */
5744       if (REG_P (op00) && (op00 == op10 || op00 == op11))
5745         return op00;
5746       else if (REG_P (op01) && (op01 == op10 || op01 == op11))
5747         return op01;
5748     }
5749
5750   /* No common register term found.  */
5751   return NULL_RTX;
5752 }
5753
5754 /* Determine the loop iterator and calculate the number of loop
5755    iterations.  Returns the exact number of loop iterations if it can
5756    be calculated, otherwise returns zero.  */
5757
5758 static unsigned HOST_WIDE_INT
5759 loop_iterations (struct loop *loop)
5760 {
5761   struct loop_info *loop_info = LOOP_INFO (loop);
5762   struct loop_ivs *ivs = LOOP_IVS (loop);
5763   rtx comparison, comparison_value;
5764   rtx iteration_var, initial_value, increment, final_value;
5765   enum rtx_code comparison_code;
5766   HOST_WIDE_INT inc;
5767   unsigned HOST_WIDE_INT abs_inc;
5768   unsigned HOST_WIDE_INT abs_diff;
5769   int off_by_one;
5770   int increment_dir;
5771   int unsigned_p, compare_dir, final_larger;
5772   rtx last_loop_insn;
5773   struct iv_class *bl;
5774
5775   loop_info->n_iterations = 0;
5776   loop_info->initial_value = 0;
5777   loop_info->initial_equiv_value = 0;
5778   loop_info->comparison_value = 0;
5779   loop_info->final_value = 0;
5780   loop_info->final_equiv_value = 0;
5781   loop_info->increment = 0;
5782   loop_info->iteration_var = 0;
5783   loop_info->iv = 0;
5784
5785   /* We used to use prev_nonnote_insn here, but that fails because it might
5786      accidentally get the branch for a contained loop if the branch for this
5787      loop was deleted.  We can only trust branches immediately before the
5788      loop_end.  */
5789   last_loop_insn = PREV_INSN (loop->end);
5790
5791   /* ??? We should probably try harder to find the jump insn
5792      at the end of the loop.  The following code assumes that
5793      the last loop insn is a jump to the top of the loop.  */
5794   if (!JUMP_P (last_loop_insn))
5795     {
5796       if (loop_dump_stream)
5797         fprintf (loop_dump_stream,
5798                  "Loop iterations: No final conditional branch found.\n");
5799       return 0;
5800     }
5801
5802   /* If there is a more than a single jump to the top of the loop
5803      we cannot (easily) determine the iteration count.  */
5804   if (LABEL_NUSES (JUMP_LABEL (last_loop_insn)) > 1)
5805     {
5806       if (loop_dump_stream)
5807         fprintf (loop_dump_stream,
5808                  "Loop iterations: Loop has multiple back edges.\n");
5809       return 0;
5810     }
5811
5812   /* Find the iteration variable.  If the last insn is a conditional
5813      branch, and the insn before tests a register value, make that the
5814      iteration variable.  */
5815
5816   comparison = get_condition_for_loop (loop, last_loop_insn);
5817   if (comparison == 0)
5818     {
5819       if (loop_dump_stream)
5820         fprintf (loop_dump_stream,
5821                  "Loop iterations: No final comparison found.\n");
5822       return 0;
5823     }
5824
5825   /* ??? Get_condition may switch position of induction variable and
5826      invariant register when it canonicalizes the comparison.  */
5827
5828   comparison_code = GET_CODE (comparison);
5829   iteration_var = XEXP (comparison, 0);
5830   comparison_value = XEXP (comparison, 1);
5831
5832   if (!REG_P (iteration_var))
5833     {
5834       if (loop_dump_stream)
5835         fprintf (loop_dump_stream,
5836                  "Loop iterations: Comparison not against register.\n");
5837       return 0;
5838     }
5839
5840   /* The only new registers that are created before loop iterations
5841      are givs made from biv increments or registers created by
5842      load_mems.  In the latter case, it is possible that try_copy_prop
5843      will propagate a new pseudo into the old iteration register but
5844      this will be marked by having the REG_USERVAR_P bit set.  */
5845
5846   gcc_assert ((unsigned) REGNO (iteration_var) < ivs->n_regs
5847               || REG_USERVAR_P (iteration_var));
5848
5849   /* Determine the initial value of the iteration variable, and the amount
5850      that it is incremented each loop.  Use the tables constructed by
5851      the strength reduction pass to calculate these values.  */
5852
5853   /* Clear the result values, in case no answer can be found.  */
5854   initial_value = 0;
5855   increment = 0;
5856
5857   /* The iteration variable can be either a giv or a biv.  Check to see
5858      which it is, and compute the variable's initial value, and increment
5859      value if possible.  */
5860
5861   /* If this is a new register, can't handle it since we don't have any
5862      reg_iv_type entry for it.  */
5863   if ((unsigned) REGNO (iteration_var) >= ivs->n_regs)
5864     {
5865       if (loop_dump_stream)
5866         fprintf (loop_dump_stream,
5867                  "Loop iterations: No reg_iv_type entry for iteration var.\n");
5868       return 0;
5869     }
5870
5871   /* Reject iteration variables larger than the host wide int size, since they
5872      could result in a number of iterations greater than the range of our
5873      `unsigned HOST_WIDE_INT' variable loop_info->n_iterations.  */
5874   else if ((GET_MODE_BITSIZE (GET_MODE (iteration_var))
5875             > HOST_BITS_PER_WIDE_INT))
5876     {
5877       if (loop_dump_stream)
5878         fprintf (loop_dump_stream,
5879                  "Loop iterations: Iteration var rejected because mode too large.\n");
5880       return 0;
5881     }
5882   else if (GET_MODE_CLASS (GET_MODE (iteration_var)) != MODE_INT)
5883     {
5884       if (loop_dump_stream)
5885         fprintf (loop_dump_stream,
5886                  "Loop iterations: Iteration var not an integer.\n");
5887       return 0;
5888     }
5889
5890   /* Try swapping the comparison to identify a suitable iv.  */
5891   if (REG_IV_TYPE (ivs, REGNO (iteration_var)) != BASIC_INDUCT
5892       && REG_IV_TYPE (ivs, REGNO (iteration_var)) != GENERAL_INDUCT
5893       && REG_P (comparison_value)
5894       && REGNO (comparison_value) < ivs->n_regs)
5895     {
5896       rtx temp = comparison_value;
5897       comparison_code = swap_condition (comparison_code);
5898       comparison_value = iteration_var;
5899       iteration_var = temp;
5900     }
5901
5902   if (REG_IV_TYPE (ivs, REGNO (iteration_var)) == BASIC_INDUCT)
5903     {
5904       gcc_assert (REGNO (iteration_var) < ivs->n_regs);
5905
5906       /* Grab initial value, only useful if it is a constant.  */
5907       bl = REG_IV_CLASS (ivs, REGNO (iteration_var));
5908       initial_value = bl->initial_value;
5909       if (!bl->biv->always_executed || bl->biv->maybe_multiple)
5910         {
5911           if (loop_dump_stream)
5912             fprintf (loop_dump_stream,
5913                      "Loop iterations: Basic induction var not set once in each iteration.\n");
5914           return 0;
5915         }
5916
5917       increment = biv_total_increment (bl);
5918     }
5919   else if (REG_IV_TYPE (ivs, REGNO (iteration_var)) == GENERAL_INDUCT)
5920     {
5921       HOST_WIDE_INT offset = 0;
5922       struct induction *v = REG_IV_INFO (ivs, REGNO (iteration_var));
5923       rtx biv_initial_value;
5924
5925       gcc_assert (REGNO (v->src_reg) < ivs->n_regs);
5926
5927       if (!v->always_executed || v->maybe_multiple)
5928         {
5929           if (loop_dump_stream)
5930             fprintf (loop_dump_stream,
5931                      "Loop iterations: General induction var not set once in each iteration.\n");
5932           return 0;
5933         }
5934
5935       bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
5936
5937       /* Increment value is mult_val times the increment value of the biv.  */
5938
5939       increment = biv_total_increment (bl);
5940       if (increment)
5941         {
5942           struct induction *biv_inc;
5943
5944           increment = fold_rtx_mult_add (v->mult_val,
5945                                          extend_value_for_giv (v, increment),
5946                                          const0_rtx, v->mode);
5947           /* The caller assumes that one full increment has occurred at the
5948              first loop test.  But that's not true when the biv is incremented
5949              after the giv is set (which is the usual case), e.g.:
5950              i = 6; do {;} while (i++ < 9) .
5951              Therefore, we bias the initial value by subtracting the amount of
5952              the increment that occurs between the giv set and the giv test.  */
5953           for (biv_inc = bl->biv; biv_inc; biv_inc = biv_inc->next_iv)
5954             {
5955               if (loop_insn_first_p (v->insn, biv_inc->insn))
5956                 {
5957                   if (REG_P (biv_inc->add_val))
5958                     {
5959                       if (loop_dump_stream)
5960                         fprintf (loop_dump_stream,
5961                                  "Loop iterations: Basic induction var add_val is REG %d.\n",
5962                                  REGNO (biv_inc->add_val));
5963                         return 0;
5964                     }
5965
5966                   /* If we have already counted it, skip it.  */
5967                   if (biv_inc->same)
5968                     continue;
5969
5970                   offset -= INTVAL (biv_inc->add_val);
5971                 }
5972             }
5973         }
5974       if (loop_dump_stream)
5975         fprintf (loop_dump_stream,
5976                  "Loop iterations: Giv iterator, initial value bias %ld.\n",
5977                  (long) offset);
5978
5979       /* Initial value is mult_val times the biv's initial value plus
5980          add_val.  Only useful if it is a constant.  */
5981       biv_initial_value = extend_value_for_giv (v, bl->initial_value);
5982       initial_value
5983         = fold_rtx_mult_add (v->mult_val,
5984                              plus_constant (biv_initial_value, offset),
5985                              v->add_val, v->mode);
5986     }
5987   else
5988     {
5989       if (loop_dump_stream)
5990         fprintf (loop_dump_stream,
5991                  "Loop iterations: Not basic or general induction var.\n");
5992       return 0;
5993     }
5994
5995   if (initial_value == 0)
5996     return 0;
5997
5998   unsigned_p = 0;
5999   off_by_one = 0;
6000   switch (comparison_code)
6001     {
6002     case LEU:
6003       unsigned_p = 1;
6004     case LE:
6005       compare_dir = 1;
6006       off_by_one = 1;
6007       break;
6008     case GEU:
6009       unsigned_p = 1;
6010     case GE:
6011       compare_dir = -1;
6012       off_by_one = -1;
6013       break;
6014     case EQ:
6015       /* Cannot determine loop iterations with this case.  */
6016       compare_dir = 0;
6017       break;
6018     case LTU:
6019       unsigned_p = 1;
6020     case LT:
6021       compare_dir = 1;
6022       break;
6023     case GTU:
6024       unsigned_p = 1;
6025     case GT:
6026       compare_dir = -1;
6027       break;
6028     case NE:
6029       compare_dir = 0;
6030       break;
6031     default:
6032       gcc_unreachable ();
6033     }
6034
6035   /* If the comparison value is an invariant register, then try to find
6036      its value from the insns before the start of the loop.  */
6037
6038   final_value = comparison_value;
6039   if (REG_P (comparison_value)
6040       && loop_invariant_p (loop, comparison_value))
6041     {
6042       final_value = loop_find_equiv_value (loop, comparison_value);
6043
6044       /* If we don't get an invariant final value, we are better
6045          off with the original register.  */
6046       if (! loop_invariant_p (loop, final_value))
6047         final_value = comparison_value;
6048     }
6049
6050   /* Calculate the approximate final value of the induction variable
6051      (on the last successful iteration).  The exact final value
6052      depends on the branch operator, and increment sign.  It will be
6053      wrong if the iteration variable is not incremented by one each
6054      time through the loop and (comparison_value + off_by_one -
6055      initial_value) % increment != 0.
6056      ??? Note that the final_value may overflow and thus final_larger
6057      will be bogus.  A potentially infinite loop will be classified
6058      as immediate, e.g. for (i = 0x7ffffff0; i <= 0x7fffffff; i++)  */
6059   if (off_by_one)
6060     final_value = plus_constant (final_value, off_by_one);
6061
6062   /* Save the calculated values describing this loop's bounds, in case
6063      precondition_loop_p will need them later.  These values can not be
6064      recalculated inside precondition_loop_p because strength reduction
6065      optimizations may obscure the loop's structure.
6066
6067      These values are only required by precondition_loop_p and insert_bct
6068      whenever the number of iterations cannot be computed at compile time.
6069      Only the difference between final_value and initial_value is
6070      important.  Note that final_value is only approximate.  */
6071   loop_info->initial_value = initial_value;
6072   loop_info->comparison_value = comparison_value;
6073   loop_info->final_value = plus_constant (comparison_value, off_by_one);
6074   loop_info->increment = increment;
6075   loop_info->iteration_var = iteration_var;
6076   loop_info->comparison_code = comparison_code;
6077   loop_info->iv = bl;
6078
6079   /* Try to determine the iteration count for loops such
6080      as (for i = init; i < init + const; i++).  When running the
6081      loop optimization twice, the first pass often converts simple
6082      loops into this form.  */
6083
6084   if (REG_P (initial_value))
6085     {
6086       rtx reg1;
6087       rtx reg2;
6088       rtx const2;
6089
6090       reg1 = initial_value;
6091       if (GET_CODE (final_value) == PLUS)
6092         reg2 = XEXP (final_value, 0), const2 = XEXP (final_value, 1);
6093       else
6094         reg2 = final_value, const2 = const0_rtx;
6095
6096       /* Check for initial_value = reg1, final_value = reg2 + const2,
6097          where reg1 != reg2.  */
6098       if (REG_P (reg2) && reg2 != reg1)
6099         {
6100           rtx temp;
6101
6102           /* Find what reg1 is equivalent to.  Hopefully it will
6103              either be reg2 or reg2 plus a constant.  */
6104           temp = loop_find_equiv_value (loop, reg1);
6105
6106           if (find_common_reg_term (temp, reg2))
6107             initial_value = temp;
6108           else if (loop_invariant_p (loop, reg2))
6109             {
6110               /* Find what reg2 is equivalent to.  Hopefully it will
6111                  either be reg1 or reg1 plus a constant.  Let's ignore
6112                  the latter case for now since it is not so common.  */
6113               temp = loop_find_equiv_value (loop, reg2);
6114
6115               if (temp == loop_info->iteration_var)
6116                 temp = initial_value;
6117               if (temp == reg1)
6118                 final_value = (const2 == const0_rtx)
6119                   ? reg1 : gen_rtx_PLUS (GET_MODE (reg1), reg1, const2);
6120             }
6121         }
6122     }
6123
6124   loop_info->initial_equiv_value = initial_value;
6125   loop_info->final_equiv_value = final_value;
6126
6127   /* For EQ comparison loops, we don't have a valid final value.
6128      Check this now so that we won't leave an invalid value if we
6129      return early for any other reason.  */
6130   if (comparison_code == EQ)
6131     loop_info->final_equiv_value = loop_info->final_value = 0;
6132
6133   if (increment == 0)
6134     {
6135       if (loop_dump_stream)
6136         fprintf (loop_dump_stream,
6137                  "Loop iterations: Increment value can't be calculated.\n");
6138       return 0;
6139     }
6140
6141   if (GET_CODE (increment) != CONST_INT)
6142     {
6143       /* If we have a REG, check to see if REG holds a constant value.  */
6144       /* ??? Other RTL, such as (neg (reg)) is possible here, but it isn't
6145          clear if it is worthwhile to try to handle such RTL.  */
6146       if (REG_P (increment) || GET_CODE (increment) == SUBREG)
6147         increment = loop_find_equiv_value (loop, increment);
6148
6149       if (GET_CODE (increment) != CONST_INT)
6150         {
6151           if (loop_dump_stream)
6152             {
6153               fprintf (loop_dump_stream,
6154                        "Loop iterations: Increment value not constant ");
6155               print_simple_rtl (loop_dump_stream, increment);
6156               fprintf (loop_dump_stream, ".\n");
6157             }
6158           return 0;
6159         }
6160       loop_info->increment = increment;
6161     }
6162
6163   if (GET_CODE (initial_value) != CONST_INT)
6164     {
6165       if (loop_dump_stream)
6166         {
6167           fprintf (loop_dump_stream,
6168                    "Loop iterations: Initial value not constant ");
6169           print_simple_rtl (loop_dump_stream, initial_value);
6170           fprintf (loop_dump_stream, ".\n");
6171         }
6172       return 0;
6173     }
6174   else if (GET_CODE (final_value) != CONST_INT)
6175     {
6176       if (loop_dump_stream)
6177         {
6178           fprintf (loop_dump_stream,
6179                    "Loop iterations: Final value not constant ");
6180           print_simple_rtl (loop_dump_stream, final_value);
6181           fprintf (loop_dump_stream, ".\n");
6182         }
6183       return 0;
6184     }
6185   else if (comparison_code == EQ)
6186     {
6187       rtx inc_once;
6188
6189       if (loop_dump_stream)
6190         fprintf (loop_dump_stream, "Loop iterations: EQ comparison loop.\n");
6191
6192       inc_once = gen_int_mode (INTVAL (initial_value) + INTVAL (increment),
6193                                GET_MODE (iteration_var));
6194
6195       if (inc_once == final_value)
6196         {
6197           /* The iterator value once through the loop is equal to the
6198              comparison value.  Either we have an infinite loop, or
6199              we'll loop twice.  */
6200           if (increment == const0_rtx)
6201             return 0;
6202           loop_info->n_iterations = 2;
6203         }
6204       else
6205         loop_info->n_iterations = 1;
6206
6207       if (GET_CODE (loop_info->initial_value) == CONST_INT)
6208         loop_info->final_value
6209           = gen_int_mode ((INTVAL (loop_info->initial_value)
6210                            + loop_info->n_iterations * INTVAL (increment)),
6211                           GET_MODE (iteration_var));
6212       else
6213         loop_info->final_value
6214           = plus_constant (loop_info->initial_value,
6215                            loop_info->n_iterations * INTVAL (increment));
6216       loop_info->final_equiv_value
6217         = gen_int_mode ((INTVAL (initial_value)
6218                          + loop_info->n_iterations * INTVAL (increment)),
6219                         GET_MODE (iteration_var));
6220       return loop_info->n_iterations;
6221     }
6222
6223   /* Final_larger is 1 if final larger, 0 if they are equal, otherwise -1.  */
6224   if (unsigned_p)
6225     final_larger
6226       = ((unsigned HOST_WIDE_INT) INTVAL (final_value)
6227          > (unsigned HOST_WIDE_INT) INTVAL (initial_value))
6228         - ((unsigned HOST_WIDE_INT) INTVAL (final_value)
6229            < (unsigned HOST_WIDE_INT) INTVAL (initial_value));
6230   else
6231     final_larger = (INTVAL (final_value) > INTVAL (initial_value))
6232       - (INTVAL (final_value) < INTVAL (initial_value));
6233
6234   if (INTVAL (increment) > 0)
6235     increment_dir = 1;
6236   else if (INTVAL (increment) == 0)
6237     increment_dir = 0;
6238   else
6239     increment_dir = -1;
6240
6241   /* There are 27 different cases: compare_dir = -1, 0, 1;
6242      final_larger = -1, 0, 1; increment_dir = -1, 0, 1.
6243      There are 4 normal cases, 4 reverse cases (where the iteration variable
6244      will overflow before the loop exits), 4 infinite loop cases, and 15
6245      immediate exit (0 or 1 iteration depending on loop type) cases.
6246      Only try to optimize the normal cases.  */
6247
6248   /* (compare_dir/final_larger/increment_dir)
6249      Normal cases: (0/-1/-1), (0/1/1), (-1/-1/-1), (1/1/1)
6250      Reverse cases: (0/-1/1), (0/1/-1), (-1/-1/1), (1/1/-1)
6251      Infinite loops: (0/-1/0), (0/1/0), (-1/-1/0), (1/1/0)
6252      Immediate exit: (0/0/X), (-1/0/X), (-1/1/X), (1/0/X), (1/-1/X) */
6253
6254   /* ?? If the meaning of reverse loops (where the iteration variable
6255      will overflow before the loop exits) is undefined, then could
6256      eliminate all of these special checks, and just always assume
6257      the loops are normal/immediate/infinite.  Note that this means
6258      the sign of increment_dir does not have to be known.  Also,
6259      since it does not really hurt if immediate exit loops or infinite loops
6260      are optimized, then that case could be ignored also, and hence all
6261      loops can be optimized.
6262
6263      According to ANSI Spec, the reverse loop case result is undefined,
6264      because the action on overflow is undefined.
6265
6266      See also the special test for NE loops below.  */
6267
6268   if (final_larger == increment_dir && final_larger != 0
6269       && (final_larger == compare_dir || compare_dir == 0))
6270     /* Normal case.  */
6271     ;
6272   else
6273     {
6274       if (loop_dump_stream)
6275         fprintf (loop_dump_stream, "Loop iterations: Not normal loop.\n");
6276       return 0;
6277     }
6278
6279   /* Calculate the number of iterations, final_value is only an approximation,
6280      so correct for that.  Note that abs_diff and n_iterations are
6281      unsigned, because they can be as large as 2^n - 1.  */
6282
6283   inc = INTVAL (increment);
6284   gcc_assert (inc);
6285   if (inc > 0)
6286     {
6287       abs_diff = INTVAL (final_value) - INTVAL (initial_value);
6288       abs_inc = inc;
6289     }
6290   else
6291     {
6292       abs_diff = INTVAL (initial_value) - INTVAL (final_value);
6293       abs_inc = -inc;
6294     }
6295
6296   /* Given that iteration_var is going to iterate over its own mode,
6297      not HOST_WIDE_INT, disregard higher bits that might have come
6298      into the picture due to sign extension of initial and final
6299      values.  */
6300   abs_diff &= ((unsigned HOST_WIDE_INT) 1
6301                << (GET_MODE_BITSIZE (GET_MODE (iteration_var)) - 1)
6302                << 1) - 1;
6303
6304   /* For NE tests, make sure that the iteration variable won't miss
6305      the final value.  If abs_diff mod abs_incr is not zero, then the
6306      iteration variable will overflow before the loop exits, and we
6307      can not calculate the number of iterations.  */
6308   if (compare_dir == 0 && (abs_diff % abs_inc) != 0)
6309     return 0;
6310
6311   /* Note that the number of iterations could be calculated using
6312      (abs_diff + abs_inc - 1) / abs_inc, provided care was taken to
6313      handle potential overflow of the summation.  */
6314   loop_info->n_iterations = abs_diff / abs_inc + ((abs_diff % abs_inc) != 0);
6315   return loop_info->n_iterations;
6316 }
6317
6318 /* Perform strength reduction and induction variable elimination.
6319
6320    Pseudo registers created during this function will be beyond the
6321    last valid index in several tables including
6322    REGS->ARRAY[I].N_TIMES_SET and REGNO_LAST_UID.  This does not cause a
6323    problem here, because the added registers cannot be givs outside of
6324    their loop, and hence will never be reconsidered.  But scan_loop
6325    must check regnos to make sure they are in bounds.  */
6326
6327 static void
6328 strength_reduce (struct loop *loop, int flags)
6329 {
6330   struct loop_info *loop_info = LOOP_INFO (loop);
6331   struct loop_regs *regs = LOOP_REGS (loop);
6332   struct loop_ivs *ivs = LOOP_IVS (loop);
6333   rtx p;
6334   /* Temporary list pointer for traversing ivs->list.  */
6335   struct iv_class *bl;
6336   /* Ratio of extra register life span we can justify
6337      for saving an instruction.  More if loop doesn't call subroutines
6338      since in that case saving an insn makes more difference
6339      and more registers are available.  */
6340   /* ??? could set this to last value of threshold in move_movables */
6341   int threshold = (loop_info->has_call ? 1 : 2) * (3 + n_non_fixed_regs);
6342   /* Map of pseudo-register replacements.  */
6343   rtx *reg_map = NULL;
6344   int reg_map_size;
6345   rtx test_reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
6346   int insn_count = count_insns_in_loop (loop);
6347
6348   addr_placeholder = gen_reg_rtx (Pmode);
6349
6350   ivs->n_regs = max_reg_before_loop;
6351   ivs->regs = xcalloc (ivs->n_regs, sizeof (struct iv));
6352
6353   /* Find all BIVs in loop.  */
6354   loop_bivs_find (loop);
6355
6356   /* Exit if there are no bivs.  */
6357   if (! ivs->list)
6358     {
6359       loop_ivs_free (loop);
6360       return;
6361     }
6362
6363   /* Determine how BIVS are initialized by looking through pre-header
6364      extended basic block.  */
6365   loop_bivs_init_find (loop);
6366
6367   /* Look at the each biv and see if we can say anything better about its
6368      initial value from any initializing insns set up above.  */
6369   loop_bivs_check (loop);
6370
6371   /* Search the loop for general induction variables.  */
6372   loop_givs_find (loop);
6373
6374   /* Try to calculate and save the number of loop iterations.  This is
6375      set to zero if the actual number can not be calculated.  This must
6376      be called after all giv's have been identified, since otherwise it may
6377      fail if the iteration variable is a giv.  */
6378   loop_iterations (loop);
6379
6380 #ifdef HAVE_prefetch
6381   if (flags & LOOP_PREFETCH)
6382     emit_prefetch_instructions (loop);
6383 #endif
6384
6385   /* Now for each giv for which we still don't know whether or not it is
6386      replaceable, check to see if it is replaceable because its final value
6387      can be calculated.  This must be done after loop_iterations is called,
6388      so that final_giv_value will work correctly.  */
6389   loop_givs_check (loop);
6390
6391   /* Try to prove that the loop counter variable (if any) is always
6392      nonnegative; if so, record that fact with a REG_NONNEG note
6393      so that "decrement and branch until zero" insn can be used.  */
6394   check_dbra_loop (loop, insn_count);
6395
6396   /* Create reg_map to hold substitutions for replaceable giv regs.
6397      Some givs might have been made from biv increments, so look at
6398      ivs->reg_iv_type for a suitable size.  */
6399   reg_map_size = ivs->n_regs;
6400   reg_map = xcalloc (reg_map_size, sizeof (rtx));
6401
6402   /* Examine each iv class for feasibility of strength reduction/induction
6403      variable elimination.  */
6404
6405   for (bl = ivs->list; bl; bl = bl->next)
6406     {
6407       struct induction *v;
6408       int benefit;
6409
6410       /* Test whether it will be possible to eliminate this biv
6411          provided all givs are reduced.  */
6412       bl->eliminable = loop_biv_eliminable_p (loop, bl, threshold, insn_count);
6413
6414       /* This will be true at the end, if all givs which depend on this
6415          biv have been strength reduced.
6416          We can't (currently) eliminate the biv unless this is so.  */
6417       bl->all_reduced = 1;
6418
6419       /* Check each extension dependent giv in this class to see if its
6420          root biv is safe from wrapping in the interior mode.  */
6421       check_ext_dependent_givs (loop, bl);
6422
6423       /* Combine all giv's for this iv_class.  */
6424       combine_givs (regs, bl);
6425
6426       for (v = bl->giv; v; v = v->next_iv)
6427         {
6428           struct induction *tv;
6429
6430           if (v->ignore || v->same)
6431             continue;
6432
6433           benefit = loop_giv_reduce_benefit (loop, bl, v, test_reg);
6434
6435           /* If an insn is not to be strength reduced, then set its ignore
6436              flag, and clear bl->all_reduced.  */
6437
6438           /* A giv that depends on a reversed biv must be reduced if it is
6439              used after the loop exit, otherwise, it would have the wrong
6440              value after the loop exit.  To make it simple, just reduce all
6441              of such giv's whether or not we know they are used after the loop
6442              exit.  */
6443
6444           if (v->lifetime * threshold * benefit < insn_count
6445               && ! bl->reversed)
6446             {
6447               if (loop_dump_stream)
6448                 fprintf (loop_dump_stream,
6449                          "giv of insn %d not worth while, %d vs %d.\n",
6450                          INSN_UID (v->insn),
6451                          v->lifetime * threshold * benefit, insn_count);
6452               v->ignore = 1;
6453               bl->all_reduced = 0;
6454             }
6455           else
6456             {
6457               /* Check that we can increment the reduced giv without a
6458                  multiply insn.  If not, reject it.  */
6459
6460               for (tv = bl->biv; tv; tv = tv->next_iv)
6461                 if (tv->mult_val == const1_rtx
6462                     && ! product_cheap_p (tv->add_val, v->mult_val))
6463                   {
6464                     if (loop_dump_stream)
6465                       fprintf (loop_dump_stream,
6466                                "giv of insn %d: would need a multiply.\n",
6467                                INSN_UID (v->insn));
6468                     v->ignore = 1;
6469                     bl->all_reduced = 0;
6470                     break;
6471                   }
6472             }
6473         }
6474
6475       /* Check for givs whose first use is their definition and whose
6476          last use is the definition of another giv.  If so, it is likely
6477          dead and should not be used to derive another giv nor to
6478          eliminate a biv.  */
6479       loop_givs_dead_check (loop, bl);
6480
6481       /* Reduce each giv that we decided to reduce.  */
6482       loop_givs_reduce (loop, bl);
6483
6484       /* Rescan all givs.  If a giv is the same as a giv not reduced, mark it
6485          as not reduced.
6486
6487          For each giv register that can be reduced now: if replaceable,
6488          substitute reduced reg wherever the old giv occurs;
6489          else add new move insn "giv_reg = reduced_reg".  */
6490       loop_givs_rescan (loop, bl, reg_map);
6491
6492       /* All the givs based on the biv bl have been reduced if they
6493          merit it.  */
6494
6495       /* For each giv not marked as maybe dead that has been combined with a
6496          second giv, clear any "maybe dead" mark on that second giv.
6497          v->new_reg will either be or refer to the register of the giv it
6498          combined with.
6499
6500          Doing this clearing avoids problems in biv elimination where
6501          a giv's new_reg is a complex value that can't be put in the
6502          insn but the giv combined with (with a reg as new_reg) is
6503          marked maybe_dead.  Since the register will be used in either
6504          case, we'd prefer it be used from the simpler giv.  */
6505
6506       for (v = bl->giv; v; v = v->next_iv)
6507         if (! v->maybe_dead && v->same)
6508           v->same->maybe_dead = 0;
6509
6510       /* Try to eliminate the biv, if it is a candidate.
6511          This won't work if ! bl->all_reduced,
6512          since the givs we planned to use might not have been reduced.
6513
6514          We have to be careful that we didn't initially think we could
6515          eliminate this biv because of a giv that we now think may be
6516          dead and shouldn't be used as a biv replacement.
6517
6518          Also, there is the possibility that we may have a giv that looks
6519          like it can be used to eliminate a biv, but the resulting insn
6520          isn't valid.  This can happen, for example, on the 88k, where a
6521          JUMP_INSN can compare a register only with zero.  Attempts to
6522          replace it with a compare with a constant will fail.
6523
6524          Note that in cases where this call fails, we may have replaced some
6525          of the occurrences of the biv with a giv, but no harm was done in
6526          doing so in the rare cases where it can occur.  */
6527
6528       if (bl->all_reduced == 1 && bl->eliminable
6529           && maybe_eliminate_biv (loop, bl, 1, threshold, insn_count))
6530         {
6531           /* ?? If we created a new test to bypass the loop entirely,
6532              or otherwise drop straight in, based on this test, then
6533              we might want to rewrite it also.  This way some later
6534              pass has more hope of removing the initialization of this
6535              biv entirely.  */
6536
6537           /* If final_value != 0, then the biv may be used after loop end
6538              and we must emit an insn to set it just in case.
6539
6540              Reversed bivs already have an insn after the loop setting their
6541              value, so we don't need another one.  We can't calculate the
6542              proper final value for such a biv here anyways.  */
6543           if (bl->final_value && ! bl->reversed)
6544               loop_insn_sink_or_swim (loop,
6545                                       gen_load_of_final_value (bl->biv->dest_reg,
6546                                                                bl->final_value));
6547
6548           if (loop_dump_stream)
6549             fprintf (loop_dump_stream, "Reg %d: biv eliminated\n",
6550                      bl->regno);
6551         }
6552       /* See above note wrt final_value.  But since we couldn't eliminate
6553          the biv, we must set the value after the loop instead of before.  */
6554       else if (bl->final_value && ! bl->reversed)
6555         loop_insn_sink (loop, gen_load_of_final_value (bl->biv->dest_reg,
6556                                                        bl->final_value));
6557     }
6558
6559   /* Go through all the instructions in the loop, making all the
6560      register substitutions scheduled in REG_MAP.  */
6561
6562   for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
6563     if (INSN_P (p))
6564       {
6565         replace_regs (PATTERN (p), reg_map, reg_map_size, 0);
6566         replace_regs (REG_NOTES (p), reg_map, reg_map_size, 0);
6567         INSN_CODE (p) = -1;
6568       }
6569
6570   if (loop_dump_stream)
6571     fprintf (loop_dump_stream, "\n");
6572
6573   loop_ivs_free (loop);
6574   if (reg_map)
6575     free (reg_map);
6576 }
6577 \f
6578 /*Record all basic induction variables calculated in the insn.  */
6579 static rtx
6580 check_insn_for_bivs (struct loop *loop, rtx p, int not_every_iteration,
6581                      int maybe_multiple)
6582 {
6583   struct loop_ivs *ivs = LOOP_IVS (loop);
6584   rtx set;
6585   rtx dest_reg;
6586   rtx inc_val;
6587   rtx mult_val;
6588   rtx *location;
6589
6590   if (NONJUMP_INSN_P (p)
6591       && (set = single_set (p))
6592       && REG_P (SET_DEST (set)))
6593     {
6594       dest_reg = SET_DEST (set);
6595       if (REGNO (dest_reg) < max_reg_before_loop
6596           && REGNO (dest_reg) >= FIRST_PSEUDO_REGISTER
6597           && REG_IV_TYPE (ivs, REGNO (dest_reg)) != NOT_BASIC_INDUCT)
6598         {
6599           if (basic_induction_var (loop, SET_SRC (set),
6600                                    GET_MODE (SET_SRC (set)),
6601                                    dest_reg, p, &inc_val, &mult_val,
6602                                    &location))
6603             {
6604               /* It is a possible basic induction variable.
6605                  Create and initialize an induction structure for it.  */
6606
6607               struct induction *v = xmalloc (sizeof (struct induction));
6608
6609               record_biv (loop, v, p, dest_reg, inc_val, mult_val, location,
6610                           not_every_iteration, maybe_multiple);
6611               REG_IV_TYPE (ivs, REGNO (dest_reg)) = BASIC_INDUCT;
6612             }
6613           else if (REGNO (dest_reg) < ivs->n_regs)
6614             REG_IV_TYPE (ivs, REGNO (dest_reg)) = NOT_BASIC_INDUCT;
6615         }
6616     }
6617   return p;
6618 }
6619 \f
6620 /* Record all givs calculated in the insn.
6621    A register is a giv if: it is only set once, it is a function of a
6622    biv and a constant (or invariant), and it is not a biv.  */
6623 static rtx
6624 check_insn_for_givs (struct loop *loop, rtx p, int not_every_iteration,
6625                      int maybe_multiple)
6626 {
6627   struct loop_regs *regs = LOOP_REGS (loop);
6628
6629   rtx set;
6630   /* Look for a general induction variable in a register.  */
6631   if (NONJUMP_INSN_P (p)
6632       && (set = single_set (p))
6633       && REG_P (SET_DEST (set))
6634       && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
6635     {
6636       rtx src_reg;
6637       rtx dest_reg;
6638       rtx add_val;
6639       rtx mult_val;
6640       rtx ext_val;
6641       int benefit;
6642       rtx regnote = 0;
6643       rtx last_consec_insn;
6644
6645       dest_reg = SET_DEST (set);
6646       if (REGNO (dest_reg) < FIRST_PSEUDO_REGISTER)
6647         return p;
6648
6649       if (/* SET_SRC is a giv.  */
6650           (general_induction_var (loop, SET_SRC (set), &src_reg, &add_val,
6651                                   &mult_val, &ext_val, 0, &benefit, VOIDmode)
6652            /* Equivalent expression is a giv.  */
6653            || ((regnote = find_reg_note (p, REG_EQUAL, NULL_RTX))
6654                && general_induction_var (loop, XEXP (regnote, 0), &src_reg,
6655                                          &add_val, &mult_val, &ext_val, 0,
6656                                          &benefit, VOIDmode)))
6657           /* Don't try to handle any regs made by loop optimization.
6658              We have nothing on them in regno_first_uid, etc.  */
6659           && REGNO (dest_reg) < max_reg_before_loop
6660           /* Don't recognize a BASIC_INDUCT_VAR here.  */
6661           && dest_reg != src_reg
6662           /* This must be the only place where the register is set.  */
6663           && (regs->array[REGNO (dest_reg)].n_times_set == 1
6664               /* or all sets must be consecutive and make a giv.  */
6665               || (benefit = consec_sets_giv (loop, benefit, p,
6666                                              src_reg, dest_reg,
6667                                              &add_val, &mult_val, &ext_val,
6668                                              &last_consec_insn))))
6669         {
6670           struct induction *v = xmalloc (sizeof (struct induction));
6671
6672           /* If this is a library call, increase benefit.  */
6673           if (find_reg_note (p, REG_RETVAL, NULL_RTX))
6674             benefit += libcall_benefit (p);
6675
6676           /* Skip the consecutive insns, if there are any.  */
6677           if (regs->array[REGNO (dest_reg)].n_times_set != 1)
6678             p = last_consec_insn;
6679
6680           record_giv (loop, v, p, src_reg, dest_reg, mult_val, add_val,
6681                       ext_val, benefit, DEST_REG, not_every_iteration,
6682                       maybe_multiple, (rtx*) 0);
6683
6684         }
6685     }
6686
6687   /* Look for givs which are memory addresses.  */
6688   if (NONJUMP_INSN_P (p))
6689     find_mem_givs (loop, PATTERN (p), p, not_every_iteration,
6690                    maybe_multiple);
6691
6692   /* Update the status of whether giv can derive other givs.  This can
6693      change when we pass a label or an insn that updates a biv.  */
6694   if (INSN_P (p) || LABEL_P (p))
6695     update_giv_derive (loop, p);
6696   return p;
6697 }
6698 \f
6699 /* Return 1 if X is a valid source for an initial value (or as value being
6700    compared against in an initial test).
6701
6702    X must be either a register or constant and must not be clobbered between
6703    the current insn and the start of the loop.
6704
6705    INSN is the insn containing X.  */
6706
6707 static int
6708 valid_initial_value_p (rtx x, rtx insn, int call_seen, rtx loop_start)
6709 {
6710   if (CONSTANT_P (x))
6711     return 1;
6712
6713   /* Only consider pseudos we know about initialized in insns whose luids
6714      we know.  */
6715   if (!REG_P (x)
6716       || REGNO (x) >= max_reg_before_loop)
6717     return 0;
6718
6719   /* Don't use call-clobbered registers across a call which clobbers it.  On
6720      some machines, don't use any hard registers at all.  */
6721   if (REGNO (x) < FIRST_PSEUDO_REGISTER
6722       && (SMALL_REGISTER_CLASSES
6723           || (call_seen
6724               && TEST_HARD_REG_BIT (regs_invalidated_by_call, REGNO (x)))))
6725     return 0;
6726
6727   /* Don't use registers that have been clobbered before the start of the
6728      loop.  */
6729   if (reg_set_between_p (x, insn, loop_start))
6730     return 0;
6731
6732   return 1;
6733 }
6734 \f
6735 /* Scan X for memory refs and check each memory address
6736    as a possible giv.  INSN is the insn whose pattern X comes from.
6737    NOT_EVERY_ITERATION is 1 if the insn might not be executed during
6738    every loop iteration.  MAYBE_MULTIPLE is 1 if the insn might be executed
6739    more than once in each loop iteration.  */
6740
6741 static void
6742 find_mem_givs (const struct loop *loop, rtx x, rtx insn,
6743                int not_every_iteration, int maybe_multiple)
6744 {
6745   int i, j;
6746   enum rtx_code code;
6747   const char *fmt;
6748
6749   if (x == 0)
6750     return;
6751
6752   code = GET_CODE (x);
6753   switch (code)
6754     {
6755     case REG:
6756     case CONST_INT:
6757     case CONST:
6758     case CONST_DOUBLE:
6759     case SYMBOL_REF:
6760     case LABEL_REF:
6761     case PC:
6762     case CC0:
6763     case ADDR_VEC:
6764     case ADDR_DIFF_VEC:
6765     case USE:
6766     case CLOBBER:
6767       return;
6768
6769     case MEM:
6770       {
6771         rtx src_reg;
6772         rtx add_val;
6773         rtx mult_val;
6774         rtx ext_val;
6775         int benefit;
6776
6777         /* This code used to disable creating GIVs with mult_val == 1 and
6778            add_val == 0.  However, this leads to lost optimizations when
6779            it comes time to combine a set of related DEST_ADDR GIVs, since
6780            this one would not be seen.  */
6781
6782         if (general_induction_var (loop, XEXP (x, 0), &src_reg, &add_val,
6783                                    &mult_val, &ext_val, 1, &benefit,
6784                                    GET_MODE (x)))
6785           {
6786             /* Found one; record it.  */
6787             struct induction *v = xmalloc (sizeof (struct induction));
6788
6789             record_giv (loop, v, insn, src_reg, addr_placeholder, mult_val,
6790                         add_val, ext_val, benefit, DEST_ADDR,
6791                         not_every_iteration, maybe_multiple, &XEXP (x, 0));
6792
6793             v->mem = x;
6794           }
6795       }
6796       return;
6797
6798     default:
6799       break;
6800     }
6801
6802   /* Recursively scan the subexpressions for other mem refs.  */
6803
6804   fmt = GET_RTX_FORMAT (code);
6805   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
6806     if (fmt[i] == 'e')
6807       find_mem_givs (loop, XEXP (x, i), insn, not_every_iteration,
6808                      maybe_multiple);
6809     else if (fmt[i] == 'E')
6810       for (j = 0; j < XVECLEN (x, i); j++)
6811         find_mem_givs (loop, XVECEXP (x, i, j), insn, not_every_iteration,
6812                        maybe_multiple);
6813 }
6814 \f
6815 /* Fill in the data about one biv update.
6816    V is the `struct induction' in which we record the biv.  (It is
6817    allocated by the caller, with alloca.)
6818    INSN is the insn that sets it.
6819    DEST_REG is the biv's reg.
6820
6821    MULT_VAL is const1_rtx if the biv is being incremented here, in which case
6822    INC_VAL is the increment.  Otherwise, MULT_VAL is const0_rtx and the biv is
6823    being set to INC_VAL.
6824
6825    NOT_EVERY_ITERATION is nonzero if this biv update is not know to be
6826    executed every iteration; MAYBE_MULTIPLE is nonzero if this biv update
6827    can be executed more than once per iteration.  If MAYBE_MULTIPLE
6828    and NOT_EVERY_ITERATION are both zero, we know that the biv update is
6829    executed exactly once per iteration.  */
6830
6831 static void
6832 record_biv (struct loop *loop, struct induction *v, rtx insn, rtx dest_reg,
6833             rtx inc_val, rtx mult_val, rtx *location,
6834             int not_every_iteration, int maybe_multiple)
6835 {
6836   struct loop_ivs *ivs = LOOP_IVS (loop);
6837   struct iv_class *bl;
6838
6839   v->insn = insn;
6840   v->src_reg = dest_reg;
6841   v->dest_reg = dest_reg;
6842   v->mult_val = mult_val;
6843   v->add_val = inc_val;
6844   v->ext_dependent = NULL_RTX;
6845   v->location = location;
6846   v->mode = GET_MODE (dest_reg);
6847   v->always_computable = ! not_every_iteration;
6848   v->always_executed = ! not_every_iteration;
6849   v->maybe_multiple = maybe_multiple;
6850   v->same = 0;
6851
6852   /* Add this to the reg's iv_class, creating a class
6853      if this is the first incrementation of the reg.  */
6854
6855   bl = REG_IV_CLASS (ivs, REGNO (dest_reg));
6856   if (bl == 0)
6857     {
6858       /* Create and initialize new iv_class.  */
6859
6860       bl = xmalloc (sizeof (struct iv_class));
6861
6862       bl->regno = REGNO (dest_reg);
6863       bl->biv = 0;
6864       bl->giv = 0;
6865       bl->biv_count = 0;
6866       bl->giv_count = 0;
6867
6868       /* Set initial value to the reg itself.  */
6869       bl->initial_value = dest_reg;
6870       bl->final_value = 0;
6871       /* We haven't seen the initializing insn yet.  */
6872       bl->init_insn = 0;
6873       bl->init_set = 0;
6874       bl->initial_test = 0;
6875       bl->incremented = 0;
6876       bl->eliminable = 0;
6877       bl->nonneg = 0;
6878       bl->reversed = 0;
6879       bl->total_benefit = 0;
6880
6881       /* Add this class to ivs->list.  */
6882       bl->next = ivs->list;
6883       ivs->list = bl;
6884
6885       /* Put it in the array of biv register classes.  */
6886       REG_IV_CLASS (ivs, REGNO (dest_reg)) = bl;
6887     }
6888   else
6889     {
6890       /* Check if location is the same as a previous one.  */
6891       struct induction *induction;
6892       for (induction = bl->biv; induction; induction = induction->next_iv)
6893         if (location == induction->location)
6894           {
6895             v->same = induction;
6896             break;
6897           }
6898     }
6899
6900   /* Update IV_CLASS entry for this biv.  */
6901   v->next_iv = bl->biv;
6902   bl->biv = v;
6903   bl->biv_count++;
6904   if (mult_val == const1_rtx)
6905     bl->incremented = 1;
6906
6907   if (loop_dump_stream)
6908     loop_biv_dump (v, loop_dump_stream, 0);
6909 }
6910 \f
6911 /* Fill in the data about one giv.
6912    V is the `struct induction' in which we record the giv.  (It is
6913    allocated by the caller, with alloca.)
6914    INSN is the insn that sets it.
6915    BENEFIT estimates the savings from deleting this insn.
6916    TYPE is DEST_REG or DEST_ADDR; it says whether the giv is computed
6917    into a register or is used as a memory address.
6918
6919    SRC_REG is the biv reg which the giv is computed from.
6920    DEST_REG is the giv's reg (if the giv is stored in a reg).
6921    MULT_VAL and ADD_VAL are the coefficients used to compute the giv.
6922    LOCATION points to the place where this giv's value appears in INSN.  */
6923
6924 static void
6925 record_giv (const struct loop *loop, struct induction *v, rtx insn,
6926             rtx src_reg, rtx dest_reg, rtx mult_val, rtx add_val,
6927             rtx ext_val, int benefit, enum g_types type,
6928             int not_every_iteration, int maybe_multiple, rtx *location)
6929 {
6930   struct loop_ivs *ivs = LOOP_IVS (loop);
6931   struct induction *b;
6932   struct iv_class *bl;
6933   rtx set = single_set (insn);
6934   rtx temp;
6935
6936   /* Attempt to prove constantness of the values.  Don't let simplify_rtx
6937      undo the MULT canonicalization that we performed earlier.  */
6938   temp = simplify_rtx (add_val);
6939   if (temp
6940       && ! (GET_CODE (add_val) == MULT
6941             && GET_CODE (temp) == ASHIFT))
6942     add_val = temp;
6943
6944   v->insn = insn;
6945   v->src_reg = src_reg;
6946   v->giv_type = type;
6947   v->dest_reg = dest_reg;
6948   v->mult_val = mult_val;
6949   v->add_val = add_val;
6950   v->ext_dependent = ext_val;
6951   v->benefit = benefit;
6952   v->location = location;
6953   v->cant_derive = 0;
6954   v->combined_with = 0;
6955   v->maybe_multiple = maybe_multiple;
6956   v->maybe_dead = 0;
6957   v->derive_adjustment = 0;
6958   v->same = 0;
6959   v->ignore = 0;
6960   v->new_reg = 0;
6961   v->final_value = 0;
6962   v->same_insn = 0;
6963   v->auto_inc_opt = 0;
6964   v->shared = 0;
6965
6966   /* The v->always_computable field is used in update_giv_derive, to
6967      determine whether a giv can be used to derive another giv.  For a
6968      DEST_REG giv, INSN computes a new value for the giv, so its value
6969      isn't computable if INSN insn't executed every iteration.
6970      However, for a DEST_ADDR giv, INSN merely uses the value of the giv;
6971      it does not compute a new value.  Hence the value is always computable
6972      regardless of whether INSN is executed each iteration.  */
6973
6974   if (type == DEST_ADDR)
6975     v->always_computable = 1;
6976   else
6977     v->always_computable = ! not_every_iteration;
6978
6979   v->always_executed = ! not_every_iteration;
6980
6981   if (type == DEST_ADDR)
6982     {
6983       v->mode = GET_MODE (*location);
6984       v->lifetime = 1;
6985     }
6986   else /* type == DEST_REG */
6987     {
6988       v->mode = GET_MODE (SET_DEST (set));
6989
6990       v->lifetime = LOOP_REG_LIFETIME (loop, REGNO (dest_reg));
6991
6992       /* If the lifetime is zero, it means that this register is
6993          really a dead store.  So mark this as a giv that can be
6994          ignored.  This will not prevent the biv from being eliminated.  */
6995       if (v->lifetime == 0)
6996         v->ignore = 1;
6997
6998       REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
6999       REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
7000     }
7001
7002   /* Add the giv to the class of givs computed from one biv.  */
7003
7004   bl = REG_IV_CLASS (ivs, REGNO (src_reg));
7005   gcc_assert (bl);
7006   v->next_iv = bl->giv;
7007   bl->giv = v;
7008
7009   /* Don't count DEST_ADDR.  This is supposed to count the number of
7010      insns that calculate givs.  */
7011   if (type == DEST_REG)
7012     bl->giv_count++;
7013   bl->total_benefit += benefit;
7014
7015   if (type == DEST_ADDR)
7016     {
7017       v->replaceable = 1;
7018       v->not_replaceable = 0;
7019     }
7020   else
7021     {
7022       /* The giv can be replaced outright by the reduced register only if all
7023          of the following conditions are true:
7024          - the insn that sets the giv is always executed on any iteration
7025            on which the giv is used at all
7026            (there are two ways to deduce this:
7027             either the insn is executed on every iteration,
7028             or all uses follow that insn in the same basic block),
7029          - the giv is not used outside the loop
7030          - no assignments to the biv occur during the giv's lifetime.  */
7031
7032       if (REGNO_FIRST_UID (REGNO (dest_reg)) == INSN_UID (insn)
7033           /* Previous line always fails if INSN was moved by loop opt.  */
7034           && REGNO_LAST_LUID (REGNO (dest_reg))
7035           < INSN_LUID (loop->end)
7036           && (! not_every_iteration
7037               || last_use_this_basic_block (dest_reg, insn)))
7038         {
7039           /* Now check that there are no assignments to the biv within the
7040              giv's lifetime.  This requires two separate checks.  */
7041
7042           /* Check each biv update, and fail if any are between the first
7043              and last use of the giv.
7044
7045              If this loop contains an inner loop that was unrolled, then
7046              the insn modifying the biv may have been emitted by the loop
7047              unrolling code, and hence does not have a valid luid.  Just
7048              mark the biv as not replaceable in this case.  It is not very
7049              useful as a biv, because it is used in two different loops.
7050              It is very unlikely that we would be able to optimize the giv
7051              using this biv anyways.  */
7052
7053           v->replaceable = 1;
7054           v->not_replaceable = 0;
7055           for (b = bl->biv; b; b = b->next_iv)
7056             {
7057               if (INSN_UID (b->insn) >= max_uid_for_loop
7058                   || ((INSN_LUID (b->insn)
7059                        >= REGNO_FIRST_LUID (REGNO (dest_reg)))
7060                       && (INSN_LUID (b->insn)
7061                           <= REGNO_LAST_LUID (REGNO (dest_reg)))))
7062                 {
7063                   v->replaceable = 0;
7064                   v->not_replaceable = 1;
7065                   break;
7066                 }
7067             }
7068
7069           /* If there are any backwards branches that go from after the
7070              biv update to before it, then this giv is not replaceable.  */
7071           if (v->replaceable)
7072             for (b = bl->biv; b; b = b->next_iv)
7073               if (back_branch_in_range_p (loop, b->insn))
7074                 {
7075                   v->replaceable = 0;
7076                   v->not_replaceable = 1;
7077                   break;
7078                 }
7079         }
7080       else
7081         {
7082           /* May still be replaceable, we don't have enough info here to
7083              decide.  */
7084           v->replaceable = 0;
7085           v->not_replaceable = 0;
7086         }
7087     }
7088
7089   /* Record whether the add_val contains a const_int, for later use by
7090      combine_givs.  */
7091   {
7092     rtx tem = add_val;
7093
7094     v->no_const_addval = 1;
7095     if (tem == const0_rtx)
7096       ;
7097     else if (CONSTANT_P (add_val))
7098       v->no_const_addval = 0;
7099     if (GET_CODE (tem) == PLUS)
7100       {
7101         while (1)
7102           {
7103             if (GET_CODE (XEXP (tem, 0)) == PLUS)
7104               tem = XEXP (tem, 0);
7105             else if (GET_CODE (XEXP (tem, 1)) == PLUS)
7106               tem = XEXP (tem, 1);
7107             else
7108               break;
7109           }
7110         if (CONSTANT_P (XEXP (tem, 1)))
7111           v->no_const_addval = 0;
7112       }
7113   }
7114
7115   if (loop_dump_stream)
7116     loop_giv_dump (v, loop_dump_stream, 0);
7117 }
7118
7119 /* Try to calculate the final value of the giv, the value it will have at
7120    the end of the loop.  If we can do it, return that value.  */
7121
7122 static rtx
7123 final_giv_value (const struct loop *loop, struct induction *v)
7124 {
7125   struct loop_ivs *ivs = LOOP_IVS (loop);
7126   struct iv_class *bl;
7127   rtx insn;
7128   rtx increment, tem;
7129   rtx seq;
7130   rtx loop_end = loop->end;
7131   unsigned HOST_WIDE_INT n_iterations = LOOP_INFO (loop)->n_iterations;
7132
7133   bl = REG_IV_CLASS (ivs, REGNO (v->src_reg));
7134
7135   /* The final value for givs which depend on reversed bivs must be calculated
7136      differently than for ordinary givs.  In this case, there is already an
7137      insn after the loop which sets this giv's final value (if necessary),
7138      and there are no other loop exits, so we can return any value.  */
7139   if (bl->reversed)
7140     {
7141       if (loop_dump_stream)
7142         fprintf (loop_dump_stream,
7143                  "Final giv value for %d, depends on reversed biv\n",
7144                  REGNO (v->dest_reg));
7145       return const0_rtx;
7146     }
7147
7148   /* Try to calculate the final value as a function of the biv it depends
7149      upon.  The only exit from the loop must be the fall through at the bottom
7150      and the insn that sets the giv must be executed on every iteration
7151      (otherwise the giv may not have its final value when the loop exits).  */
7152
7153   /* ??? Can calculate the final giv value by subtracting off the
7154      extra biv increments times the giv's mult_val.  The loop must have
7155      only one exit for this to work, but the loop iterations does not need
7156      to be known.  */
7157
7158   if (n_iterations != 0
7159       && ! loop->exit_count
7160       && v->always_executed)
7161     {
7162       /* ?? It is tempting to use the biv's value here since these insns will
7163          be put after the loop, and hence the biv will have its final value
7164          then.  However, this fails if the biv is subsequently eliminated.
7165          Perhaps determine whether biv's are eliminable before trying to
7166          determine whether giv's are replaceable so that we can use the
7167          biv value here if it is not eliminable.  */
7168
7169       /* We are emitting code after the end of the loop, so we must make
7170          sure that bl->initial_value is still valid then.  It will still
7171          be valid if it is invariant.  */
7172
7173       increment = biv_total_increment (bl);
7174
7175       if (increment && loop_invariant_p (loop, increment)
7176           && loop_invariant_p (loop, bl->initial_value))
7177         {
7178           /* Can calculate the loop exit value of its biv as
7179              (n_iterations * increment) + initial_value */
7180
7181           /* The loop exit value of the giv is then
7182              (final_biv_value - extra increments) * mult_val + add_val.
7183              The extra increments are any increments to the biv which
7184              occur in the loop after the giv's value is calculated.
7185              We must search from the insn that sets the giv to the end
7186              of the loop to calculate this value.  */
7187
7188           /* Put the final biv value in tem.  */
7189           tem = gen_reg_rtx (v->mode);
7190           record_base_value (REGNO (tem), bl->biv->add_val, 0);
7191           loop_iv_add_mult_sink (loop, extend_value_for_giv (v, increment),
7192                                  GEN_INT (n_iterations),
7193                                  extend_value_for_giv (v, bl->initial_value),
7194                                  tem);
7195
7196           /* Subtract off extra increments as we find them.  */
7197           for (insn = NEXT_INSN (v->insn); insn != loop_end;
7198                insn = NEXT_INSN (insn))
7199             {
7200               struct induction *biv;
7201
7202               for (biv = bl->biv; biv; biv = biv->next_iv)
7203                 if (biv->insn == insn)
7204                   {
7205                     start_sequence ();
7206                     tem = expand_simple_binop (GET_MODE (tem), MINUS, tem,
7207                                                biv->add_val, NULL_RTX, 0,
7208                                                OPTAB_LIB_WIDEN);
7209                     seq = get_insns ();
7210                     end_sequence ();
7211                     loop_insn_sink (loop, seq);
7212                   }
7213             }
7214
7215           /* Now calculate the giv's final value.  */
7216           loop_iv_add_mult_sink (loop, tem, v->mult_val, v->add_val, tem);
7217
7218           if (loop_dump_stream)
7219             fprintf (loop_dump_stream,
7220                      "Final giv value for %d, calc from biv's value.\n",
7221                      REGNO (v->dest_reg));
7222
7223           return tem;
7224         }
7225     }
7226
7227   /* Replaceable giv's should never reach here.  */
7228   gcc_assert (!v->replaceable);
7229
7230   /* Check to see if the biv is dead at all loop exits.  */
7231   if (reg_dead_after_loop (loop, v->dest_reg))
7232     {
7233       if (loop_dump_stream)
7234         fprintf (loop_dump_stream,
7235                  "Final giv value for %d, giv dead after loop exit.\n",
7236                  REGNO (v->dest_reg));
7237
7238       return const0_rtx;
7239     }
7240
7241   return 0;
7242 }
7243
7244 /* All this does is determine whether a giv can be made replaceable because
7245    its final value can be calculated.  This code can not be part of record_giv
7246    above, because final_giv_value requires that the number of loop iterations
7247    be known, and that can not be accurately calculated until after all givs
7248    have been identified.  */
7249
7250 static void
7251 check_final_value (const struct loop *loop, struct induction *v)
7252 {
7253   rtx final_value = 0;
7254
7255   /* DEST_ADDR givs will never reach here, because they are always marked
7256      replaceable above in record_giv.  */
7257
7258   /* The giv can be replaced outright by the reduced register only if all
7259      of the following conditions are true:
7260      - the insn that sets the giv is always executed on any iteration
7261        on which the giv is used at all
7262        (there are two ways to deduce this:
7263         either the insn is executed on every iteration,
7264         or all uses follow that insn in the same basic block),
7265      - its final value can be calculated (this condition is different
7266        than the one above in record_giv)
7267      - it's not used before the it's set
7268      - no assignments to the biv occur during the giv's lifetime.  */
7269
7270 #if 0
7271   /* This is only called now when replaceable is known to be false.  */
7272   /* Clear replaceable, so that it won't confuse final_giv_value.  */
7273   v->replaceable = 0;
7274 #endif
7275
7276   if ((final_value = final_giv_value (loop, v))
7277       && (v->always_executed
7278           || last_use_this_basic_block (v->dest_reg, v->insn)))
7279     {
7280       int biv_increment_seen = 0, before_giv_insn = 0;
7281       rtx p = v->insn;
7282       rtx last_giv_use;
7283
7284       v->replaceable = 1;
7285       v->not_replaceable = 0;
7286
7287       /* When trying to determine whether or not a biv increment occurs
7288          during the lifetime of the giv, we can ignore uses of the variable
7289          outside the loop because final_value is true.  Hence we can not
7290          use regno_last_uid and regno_first_uid as above in record_giv.  */
7291
7292       /* Search the loop to determine whether any assignments to the
7293          biv occur during the giv's lifetime.  Start with the insn
7294          that sets the giv, and search around the loop until we come
7295          back to that insn again.
7296
7297          Also fail if there is a jump within the giv's lifetime that jumps
7298          to somewhere outside the lifetime but still within the loop.  This
7299          catches spaghetti code where the execution order is not linear, and
7300          hence the above test fails.  Here we assume that the giv lifetime
7301          does not extend from one iteration of the loop to the next, so as
7302          to make the test easier.  Since the lifetime isn't known yet,
7303          this requires two loops.  See also record_giv above.  */
7304
7305       last_giv_use = v->insn;
7306
7307       while (1)
7308         {
7309           p = NEXT_INSN (p);
7310           if (p == loop->end)
7311             {
7312               before_giv_insn = 1;
7313               p = NEXT_INSN (loop->start);
7314             }
7315           if (p == v->insn)
7316             break;
7317
7318           if (INSN_P (p))
7319             {
7320               /* It is possible for the BIV increment to use the GIV if we
7321                  have a cycle.  Thus we must be sure to check each insn for
7322                  both BIV and GIV uses, and we must check for BIV uses
7323                  first.  */
7324
7325               if (! biv_increment_seen
7326                   && reg_set_p (v->src_reg, PATTERN (p)))
7327                 biv_increment_seen = 1;
7328
7329               if (reg_mentioned_p (v->dest_reg, PATTERN (p)))
7330                 {
7331                   if (biv_increment_seen || before_giv_insn)
7332                     {
7333                       v->replaceable = 0;
7334                       v->not_replaceable = 1;
7335                       break;
7336                     }
7337                   last_giv_use = p;
7338                 }
7339             }
7340         }
7341
7342       /* Now that the lifetime of the giv is known, check for branches
7343          from within the lifetime to outside the lifetime if it is still
7344          replaceable.  */
7345
7346       if (v->replaceable)
7347         {
7348           p = v->insn;
7349           while (1)
7350             {
7351               p = NEXT_INSN (p);
7352               if (p == loop->end)
7353                 p = NEXT_INSN (loop->start);
7354               if (p == last_giv_use)
7355                 break;
7356
7357               if (JUMP_P (p) && JUMP_LABEL (p)
7358                   && LABEL_NAME (JUMP_LABEL (p))
7359                   && ((loop_insn_first_p (JUMP_LABEL (p), v->insn)
7360                        && loop_insn_first_p (loop->start, JUMP_LABEL (p)))
7361                       || (loop_insn_first_p (last_giv_use, JUMP_LABEL (p))
7362                           && loop_insn_first_p (JUMP_LABEL (p), loop->end))))
7363                 {
7364                   v->replaceable = 0;
7365                   v->not_replaceable = 1;
7366
7367                   if (loop_dump_stream)
7368                     fprintf (loop_dump_stream,
7369                              "Found branch outside giv lifetime.\n");
7370
7371                   break;
7372                 }
7373             }
7374         }
7375
7376       /* If it is replaceable, then save the final value.  */
7377       if (v->replaceable)
7378         v->final_value = final_value;
7379     }
7380
7381   if (loop_dump_stream && v->replaceable)
7382     fprintf (loop_dump_stream, "Insn %d: giv reg %d final_value replaceable\n",
7383              INSN_UID (v->insn), REGNO (v->dest_reg));
7384 }
7385 \f
7386 /* Update the status of whether a giv can derive other givs.
7387
7388    We need to do something special if there is or may be an update to the biv
7389    between the time the giv is defined and the time it is used to derive
7390    another giv.
7391
7392    In addition, a giv that is only conditionally set is not allowed to
7393    derive another giv once a label has been passed.
7394
7395    The cases we look at are when a label or an update to a biv is passed.  */
7396
7397 static void
7398 update_giv_derive (const struct loop *loop, rtx p)
7399 {
7400   struct loop_ivs *ivs = LOOP_IVS (loop);
7401   struct iv_class *bl;
7402   struct induction *biv, *giv;
7403   rtx tem;
7404   int dummy;
7405
7406   /* Search all IV classes, then all bivs, and finally all givs.
7407
7408      There are three cases we are concerned with.  First we have the situation
7409      of a giv that is only updated conditionally.  In that case, it may not
7410      derive any givs after a label is passed.
7411
7412      The second case is when a biv update occurs, or may occur, after the
7413      definition of a giv.  For certain biv updates (see below) that are
7414      known to occur between the giv definition and use, we can adjust the
7415      giv definition.  For others, or when the biv update is conditional,
7416      we must prevent the giv from deriving any other givs.  There are two
7417      sub-cases within this case.
7418
7419      If this is a label, we are concerned with any biv update that is done
7420      conditionally, since it may be done after the giv is defined followed by
7421      a branch here (actually, we need to pass both a jump and a label, but
7422      this extra tracking doesn't seem worth it).
7423
7424      If this is a jump, we are concerned about any biv update that may be
7425      executed multiple times.  We are actually only concerned about
7426      backward jumps, but it is probably not worth performing the test
7427      on the jump again here.
7428
7429      If this is a biv update, we must adjust the giv status to show that a
7430      subsequent biv update was performed.  If this adjustment cannot be done,
7431      the giv cannot derive further givs.  */
7432
7433   for (bl = ivs->list; bl; bl = bl->next)
7434     for (biv = bl->biv; biv; biv = biv->next_iv)
7435       if (LABEL_P (p) || JUMP_P (p)
7436           || biv->insn == p)
7437         {
7438           /* Skip if location is the same as a previous one.  */
7439           if (biv->same)
7440             continue;
7441
7442           for (giv = bl->giv; giv; giv = giv->next_iv)
7443             {
7444               /* If cant_derive is already true, there is no point in
7445                  checking all of these conditions again.  */
7446               if (giv->cant_derive)
7447                 continue;
7448
7449               /* If this giv is conditionally set and we have passed a label,
7450                  it cannot derive anything.  */
7451               if (LABEL_P (p) && ! giv->always_computable)
7452                 giv->cant_derive = 1;
7453
7454               /* Skip givs that have mult_val == 0, since
7455                  they are really invariants.  Also skip those that are
7456                  replaceable, since we know their lifetime doesn't contain
7457                  any biv update.  */
7458               else if (giv->mult_val == const0_rtx || giv->replaceable)
7459                 continue;
7460
7461               /* The only way we can allow this giv to derive another
7462                  is if this is a biv increment and we can form the product
7463                  of biv->add_val and giv->mult_val.  In this case, we will
7464                  be able to compute a compensation.  */
7465               else if (biv->insn == p)
7466                 {
7467                   rtx ext_val_dummy;
7468
7469                   tem = 0;
7470                   if (biv->mult_val == const1_rtx)
7471                     tem = simplify_giv_expr (loop,
7472                                              gen_rtx_MULT (giv->mode,
7473                                                            biv->add_val,
7474                                                            giv->mult_val),
7475                                              &ext_val_dummy, &dummy);
7476
7477                   if (tem && giv->derive_adjustment)
7478                     tem = simplify_giv_expr
7479                       (loop,
7480                        gen_rtx_PLUS (giv->mode, tem, giv->derive_adjustment),
7481                        &ext_val_dummy, &dummy);
7482
7483                   if (tem)
7484                     giv->derive_adjustment = tem;
7485                   else
7486                     giv->cant_derive = 1;
7487                 }
7488               else if ((LABEL_P (p) && ! biv->always_computable)
7489                        || (JUMP_P (p) && biv->maybe_multiple))
7490                 giv->cant_derive = 1;
7491             }
7492         }
7493 }
7494 \f
7495 /* Check whether an insn is an increment legitimate for a basic induction var.
7496    X is the source of insn P, or a part of it.
7497    MODE is the mode in which X should be interpreted.
7498
7499    DEST_REG is the putative biv, also the destination of the insn.
7500    We accept patterns of these forms:
7501      REG = REG + INVARIANT (includes REG = REG - CONSTANT)
7502      REG = INVARIANT + REG
7503
7504    If X is suitable, we return 1, set *MULT_VAL to CONST1_RTX,
7505    store the additive term into *INC_VAL, and store the place where
7506    we found the additive term into *LOCATION.
7507
7508    If X is an assignment of an invariant into DEST_REG, we set
7509    *MULT_VAL to CONST0_RTX, and store the invariant into *INC_VAL.
7510
7511    We also want to detect a BIV when it corresponds to a variable
7512    whose mode was promoted.  In that case, an increment
7513    of the variable may be a PLUS that adds a SUBREG of that variable to
7514    an invariant and then sign- or zero-extends the result of the PLUS
7515    into the variable.
7516
7517    Most GIVs in such cases will be in the promoted mode, since that is the
7518    probably the natural computation mode (and almost certainly the mode
7519    used for addresses) on the machine.  So we view the pseudo-reg containing
7520    the variable as the BIV, as if it were simply incremented.
7521
7522    Note that treating the entire pseudo as a BIV will result in making
7523    simple increments to any GIVs based on it.  However, if the variable
7524    overflows in its declared mode but not its promoted mode, the result will
7525    be incorrect.  This is acceptable if the variable is signed, since
7526    overflows in such cases are undefined, but not if it is unsigned, since
7527    those overflows are defined.  So we only check for SIGN_EXTEND and
7528    not ZERO_EXTEND.
7529
7530    If we cannot find a biv, we return 0.  */
7531
7532 static int
7533 basic_induction_var (const struct loop *loop, rtx x, enum machine_mode mode,
7534                      rtx dest_reg, rtx p, rtx *inc_val, rtx *mult_val,
7535                      rtx **location)
7536 {
7537   enum rtx_code code;
7538   rtx *argp, arg;
7539   rtx insn, set = 0, last, inc;
7540
7541   code = GET_CODE (x);
7542   *location = NULL;
7543   switch (code)
7544     {
7545     case PLUS:
7546       if (rtx_equal_p (XEXP (x, 0), dest_reg)
7547           || (GET_CODE (XEXP (x, 0)) == SUBREG
7548               && SUBREG_PROMOTED_VAR_P (XEXP (x, 0))
7549               && SUBREG_REG (XEXP (x, 0)) == dest_reg))
7550         {
7551           argp = &XEXP (x, 1);
7552         }
7553       else if (rtx_equal_p (XEXP (x, 1), dest_reg)
7554                || (GET_CODE (XEXP (x, 1)) == SUBREG
7555                    && SUBREG_PROMOTED_VAR_P (XEXP (x, 1))
7556                    && SUBREG_REG (XEXP (x, 1)) == dest_reg))
7557         {
7558           argp = &XEXP (x, 0);
7559         }
7560       else
7561         return 0;
7562
7563       arg = *argp;
7564       if (loop_invariant_p (loop, arg) != 1)
7565         return 0;
7566
7567       /* convert_modes can emit new instructions, e.g. when arg is a loop
7568          invariant MEM and dest_reg has a different mode.
7569          These instructions would be emitted after the end of the function
7570          and then *inc_val would be an uninitialized pseudo.
7571          Detect this and bail in this case.
7572          Other alternatives to solve this can be introducing a convert_modes
7573          variant which is allowed to fail but not allowed to emit new
7574          instructions, emit these instructions before loop start and let
7575          it be garbage collected if *inc_val is never used or saving the
7576          *inc_val initialization sequence generated here and when *inc_val
7577          is going to be actually used, emit it at some suitable place.  */
7578       last = get_last_insn ();
7579       inc = convert_modes (GET_MODE (dest_reg), GET_MODE (x), arg, 0);
7580       if (get_last_insn () != last)
7581         {
7582           delete_insns_since (last);
7583           return 0;
7584         }
7585
7586       *inc_val = inc;
7587       *mult_val = const1_rtx;
7588       *location = argp;
7589       return 1;
7590
7591     case SUBREG:
7592       /* If what's inside the SUBREG is a BIV, then the SUBREG.  This will
7593          handle addition of promoted variables.
7594          ??? The comment at the start of this function is wrong: promoted
7595          variable increments don't look like it says they do.  */
7596       return basic_induction_var (loop, SUBREG_REG (x),
7597                                   GET_MODE (SUBREG_REG (x)),
7598                                   dest_reg, p, inc_val, mult_val, location);
7599
7600     case REG:
7601       /* If this register is assigned in a previous insn, look at its
7602          source, but don't go outside the loop or past a label.  */
7603
7604       /* If this sets a register to itself, we would repeat any previous
7605          biv increment if we applied this strategy blindly.  */
7606       if (rtx_equal_p (dest_reg, x))
7607         return 0;
7608
7609       insn = p;
7610       while (1)
7611         {
7612           rtx dest;
7613           do
7614             {
7615               insn = PREV_INSN (insn);
7616             }
7617           while (insn && NOTE_P (insn)
7618                  && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
7619
7620           if (!insn)
7621             break;
7622           set = single_set (insn);
7623           if (set == 0)
7624             break;
7625           dest = SET_DEST (set);
7626           if (dest == x
7627               || (GET_CODE (dest) == SUBREG
7628                   && (GET_MODE_SIZE (GET_MODE (dest)) <= UNITS_PER_WORD)
7629                   && (GET_MODE_CLASS (GET_MODE (dest)) == MODE_INT)
7630                   && SUBREG_REG (dest) == x))
7631             return basic_induction_var (loop, SET_SRC (set),
7632                                         (GET_MODE (SET_SRC (set)) == VOIDmode
7633                                          ? GET_MODE (x)
7634                                          : GET_MODE (SET_SRC (set))),
7635                                         dest_reg, insn,
7636                                         inc_val, mult_val, location);
7637
7638           while (GET_CODE (dest) == SUBREG
7639                  || GET_CODE (dest) == ZERO_EXTRACT
7640                  || GET_CODE (dest) == STRICT_LOW_PART)
7641             dest = XEXP (dest, 0);
7642           if (dest == x)
7643             break;
7644         }
7645       /* Fall through.  */
7646
7647       /* Can accept constant setting of biv only when inside inner most loop.
7648          Otherwise, a biv of an inner loop may be incorrectly recognized
7649          as a biv of the outer loop,
7650          causing code to be moved INTO the inner loop.  */
7651     case MEM:
7652       if (loop_invariant_p (loop, x) != 1)
7653         return 0;
7654     case CONST_INT:
7655     case SYMBOL_REF:
7656     case CONST:
7657       /* convert_modes dies if we try to convert to or from CCmode, so just
7658          exclude that case.  It is very unlikely that a condition code value
7659          would be a useful iterator anyways.  convert_modes dies if we try to
7660          convert a float mode to non-float or vice versa too.  */
7661       if (loop->level == 1
7662           && GET_MODE_CLASS (mode) == GET_MODE_CLASS (GET_MODE (dest_reg))
7663           && GET_MODE_CLASS (mode) != MODE_CC)
7664         {
7665           /* Possible bug here?  Perhaps we don't know the mode of X.  */
7666           last = get_last_insn ();
7667           inc = convert_modes (GET_MODE (dest_reg), mode, x, 0);
7668           if (get_last_insn () != last)
7669             {
7670               delete_insns_since (last);
7671               return 0;
7672             }
7673
7674           *inc_val = inc;
7675           *mult_val = const0_rtx;
7676           return 1;
7677         }
7678       else
7679         return 0;
7680
7681     case SIGN_EXTEND:
7682       /* Ignore this BIV if signed arithmetic overflow is defined.  */
7683       if (flag_wrapv)
7684         return 0;
7685       return basic_induction_var (loop, XEXP (x, 0), GET_MODE (XEXP (x, 0)),
7686                                   dest_reg, p, inc_val, mult_val, location);
7687
7688     case ASHIFTRT:
7689       /* Similar, since this can be a sign extension.  */
7690       for (insn = PREV_INSN (p);
7691            (insn && NOTE_P (insn)
7692             && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
7693            insn = PREV_INSN (insn))
7694         ;
7695
7696       if (insn)
7697         set = single_set (insn);
7698
7699       if (! rtx_equal_p (dest_reg, XEXP (x, 0))
7700           && set && SET_DEST (set) == XEXP (x, 0)
7701           && GET_CODE (XEXP (x, 1)) == CONST_INT
7702           && INTVAL (XEXP (x, 1)) >= 0
7703           && GET_CODE (SET_SRC (set)) == ASHIFT
7704           && XEXP (x, 1) == XEXP (SET_SRC (set), 1))
7705         return basic_induction_var (loop, XEXP (SET_SRC (set), 0),
7706                                     GET_MODE (XEXP (x, 0)),
7707                                     dest_reg, insn, inc_val, mult_val,
7708                                     location);
7709       return 0;
7710
7711     default:
7712       return 0;
7713     }
7714 }
7715 \f
7716 /* A general induction variable (giv) is any quantity that is a linear
7717    function   of a basic induction variable,
7718    i.e. giv = biv * mult_val + add_val.
7719    The coefficients can be any loop invariant quantity.
7720    A giv need not be computed directly from the biv;
7721    it can be computed by way of other givs.  */
7722
7723 /* Determine whether X computes a giv.
7724    If it does, return a nonzero value
7725      which is the benefit from eliminating the computation of X;
7726    set *SRC_REG to the register of the biv that it is computed from;
7727    set *ADD_VAL and *MULT_VAL to the coefficients,
7728      such that the value of X is biv * mult + add;  */
7729
7730 static int
7731 general_induction_var (const struct loop *loop, rtx x, rtx *src_reg,
7732                        rtx *add_val, rtx *mult_val, rtx *ext_val,
7733                        int is_addr, int *pbenefit,
7734                        enum machine_mode addr_mode)
7735 {
7736   struct loop_ivs *ivs = LOOP_IVS (loop);
7737   rtx orig_x = x;
7738
7739   /* If this is an invariant, forget it, it isn't a giv.  */
7740   if (loop_invariant_p (loop, x) == 1)
7741     return 0;
7742
7743   *pbenefit = 0;
7744   *ext_val = NULL_RTX;
7745   x = simplify_giv_expr (loop, x, ext_val, pbenefit);
7746   if (x == 0)
7747     return 0;
7748
7749   switch (GET_CODE (x))
7750     {
7751     case USE:
7752     case CONST_INT:
7753       /* Since this is now an invariant and wasn't before, it must be a giv
7754          with MULT_VAL == 0.  It doesn't matter which BIV we associate this
7755          with.  */
7756       *src_reg = ivs->list->biv->dest_reg;
7757       *mult_val = const0_rtx;
7758       *add_val = x;
7759       break;
7760
7761     case REG:
7762       /* This is equivalent to a BIV.  */
7763       *src_reg = x;
7764       *mult_val = const1_rtx;
7765       *add_val = const0_rtx;
7766       break;
7767
7768     case PLUS:
7769       /* Either (plus (biv) (invar)) or
7770          (plus (mult (biv) (invar_1)) (invar_2)).  */
7771       if (GET_CODE (XEXP (x, 0)) == MULT)
7772         {
7773           *src_reg = XEXP (XEXP (x, 0), 0);
7774           *mult_val = XEXP (XEXP (x, 0), 1);
7775         }
7776       else
7777         {
7778           *src_reg = XEXP (x, 0);
7779           *mult_val = const1_rtx;
7780         }
7781       *add_val = XEXP (x, 1);
7782       break;
7783
7784     case MULT:
7785       /* ADD_VAL is zero.  */
7786       *src_reg = XEXP (x, 0);
7787       *mult_val = XEXP (x, 1);
7788       *add_val = const0_rtx;
7789       break;
7790
7791     default:
7792       gcc_unreachable ();
7793     }
7794
7795   /* Remove any enclosing USE from ADD_VAL and MULT_VAL (there will be
7796      unless they are CONST_INT).  */
7797   if (GET_CODE (*add_val) == USE)
7798     *add_val = XEXP (*add_val, 0);
7799   if (GET_CODE (*mult_val) == USE)
7800     *mult_val = XEXP (*mult_val, 0);
7801
7802   if (is_addr)
7803     *pbenefit += address_cost (orig_x, addr_mode) - reg_address_cost;
7804   else
7805     *pbenefit += rtx_cost (orig_x, SET);
7806
7807   /* Always return true if this is a giv so it will be detected as such,
7808      even if the benefit is zero or negative.  This allows elimination
7809      of bivs that might otherwise not be eliminated.  */
7810   return 1;
7811 }
7812 \f
7813 /* Given an expression, X, try to form it as a linear function of a biv.
7814    We will canonicalize it to be of the form
7815         (plus (mult (BIV) (invar_1))
7816               (invar_2))
7817    with possible degeneracies.
7818
7819    The invariant expressions must each be of a form that can be used as a
7820    machine operand.  We surround then with a USE rtx (a hack, but localized
7821    and certainly unambiguous!) if not a CONST_INT for simplicity in this
7822    routine; it is the caller's responsibility to strip them.
7823
7824    If no such canonicalization is possible (i.e., two biv's are used or an
7825    expression that is neither invariant nor a biv or giv), this routine
7826    returns 0.
7827
7828    For a nonzero return, the result will have a code of CONST_INT, USE,
7829    REG (for a BIV), PLUS, or MULT.  No other codes will occur.
7830
7831    *BENEFIT will be incremented by the benefit of any sub-giv encountered.  */
7832
7833 static rtx sge_plus (enum machine_mode, rtx, rtx);
7834 static rtx sge_plus_constant (rtx, rtx);
7835
7836 static rtx
7837 simplify_giv_expr (const struct loop *loop, rtx x, rtx *ext_val, int *benefit)
7838 {
7839   struct loop_ivs *ivs = LOOP_IVS (loop);
7840   struct loop_regs *regs = LOOP_REGS (loop);
7841   enum machine_mode mode = GET_MODE (x);
7842   rtx arg0, arg1;
7843   rtx tem;
7844
7845   /* If this is not an integer mode, or if we cannot do arithmetic in this
7846      mode, this can't be a giv.  */
7847   if (mode != VOIDmode
7848       && (GET_MODE_CLASS (mode) != MODE_INT
7849           || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT))
7850     return NULL_RTX;
7851
7852   switch (GET_CODE (x))
7853     {
7854     case PLUS:
7855       arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
7856       arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
7857       if (arg0 == 0 || arg1 == 0)
7858         return NULL_RTX;
7859
7860       /* Put constant last, CONST_INT last if both constant.  */
7861       if ((GET_CODE (arg0) == USE
7862            || GET_CODE (arg0) == CONST_INT)
7863           && ! ((GET_CODE (arg0) == USE
7864                  && GET_CODE (arg1) == USE)
7865                 || GET_CODE (arg1) == CONST_INT))
7866         tem = arg0, arg0 = arg1, arg1 = tem;
7867
7868       /* Handle addition of zero, then addition of an invariant.  */
7869       if (arg1 == const0_rtx)
7870         return arg0;
7871       else if (GET_CODE (arg1) == CONST_INT || GET_CODE (arg1) == USE)
7872         switch (GET_CODE (arg0))
7873           {
7874           case CONST_INT:
7875           case USE:
7876             /* Adding two invariants must result in an invariant, so enclose
7877                addition operation inside a USE and return it.  */
7878             if (GET_CODE (arg0) == USE)
7879               arg0 = XEXP (arg0, 0);
7880             if (GET_CODE (arg1) == USE)
7881               arg1 = XEXP (arg1, 0);
7882
7883             if (GET_CODE (arg0) == CONST_INT)
7884               tem = arg0, arg0 = arg1, arg1 = tem;
7885             if (GET_CODE (arg1) == CONST_INT)
7886               tem = sge_plus_constant (arg0, arg1);
7887             else
7888               tem = sge_plus (mode, arg0, arg1);
7889
7890             if (GET_CODE (tem) != CONST_INT)
7891               tem = gen_rtx_USE (mode, tem);
7892             return tem;
7893
7894           case REG:
7895           case MULT:
7896             /* biv + invar or mult + invar.  Return sum.  */
7897             return gen_rtx_PLUS (mode, arg0, arg1);
7898
7899           case PLUS:
7900             /* (a + invar_1) + invar_2.  Associate.  */
7901             return
7902               simplify_giv_expr (loop,
7903                                  gen_rtx_PLUS (mode,
7904                                                XEXP (arg0, 0),
7905                                                gen_rtx_PLUS (mode,
7906                                                              XEXP (arg0, 1),
7907                                                              arg1)),
7908                                  ext_val, benefit);
7909
7910           default:
7911             gcc_unreachable ();
7912           }
7913
7914       /* Each argument must be either REG, PLUS, or MULT.  Convert REG to
7915          MULT to reduce cases.  */
7916       if (REG_P (arg0))
7917         arg0 = gen_rtx_MULT (mode, arg0, const1_rtx);
7918       if (REG_P (arg1))
7919         arg1 = gen_rtx_MULT (mode, arg1, const1_rtx);
7920
7921       /* Now have PLUS + PLUS, PLUS + MULT, MULT + PLUS, or MULT + MULT.
7922          Put a MULT first, leaving PLUS + PLUS, MULT + PLUS, or MULT + MULT.
7923          Recurse to associate the second PLUS.  */
7924       if (GET_CODE (arg1) == MULT)
7925         tem = arg0, arg0 = arg1, arg1 = tem;
7926
7927       if (GET_CODE (arg1) == PLUS)
7928         return
7929           simplify_giv_expr (loop,
7930                              gen_rtx_PLUS (mode,
7931                                            gen_rtx_PLUS (mode, arg0,
7932                                                          XEXP (arg1, 0)),
7933                                            XEXP (arg1, 1)),
7934                              ext_val, benefit);
7935
7936       /* Now must have MULT + MULT.  Distribute if same biv, else not giv.  */
7937       if (GET_CODE (arg0) != MULT || GET_CODE (arg1) != MULT)
7938         return NULL_RTX;
7939
7940       if (!rtx_equal_p (arg0, arg1))
7941         return NULL_RTX;
7942
7943       return simplify_giv_expr (loop,
7944                                 gen_rtx_MULT (mode,
7945                                               XEXP (arg0, 0),
7946                                               gen_rtx_PLUS (mode,
7947                                                             XEXP (arg0, 1),
7948                                                             XEXP (arg1, 1))),
7949                                 ext_val, benefit);
7950
7951     case MINUS:
7952       /* Handle "a - b" as "a + b * (-1)".  */
7953       return simplify_giv_expr (loop,
7954                                 gen_rtx_PLUS (mode,
7955                                               XEXP (x, 0),
7956                                               gen_rtx_MULT (mode,
7957                                                             XEXP (x, 1),
7958                                                             constm1_rtx)),
7959                                 ext_val, benefit);
7960
7961     case MULT:
7962       arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
7963       arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
7964       if (arg0 == 0 || arg1 == 0)
7965         return NULL_RTX;
7966
7967       /* Put constant last, CONST_INT last if both constant.  */
7968       if ((GET_CODE (arg0) == USE || GET_CODE (arg0) == CONST_INT)
7969           && GET_CODE (arg1) != CONST_INT)
7970         tem = arg0, arg0 = arg1, arg1 = tem;
7971
7972       /* If second argument is not now constant, not giv.  */
7973       if (GET_CODE (arg1) != USE && GET_CODE (arg1) != CONST_INT)
7974         return NULL_RTX;
7975
7976       /* Handle multiply by 0 or 1.  */
7977       if (arg1 == const0_rtx)
7978         return const0_rtx;
7979
7980       else if (arg1 == const1_rtx)
7981         return arg0;
7982
7983       switch (GET_CODE (arg0))
7984         {
7985         case REG:
7986           /* biv * invar.  Done.  */
7987           return gen_rtx_MULT (mode, arg0, arg1);
7988
7989         case CONST_INT:
7990           /* Product of two constants.  */
7991           return GEN_INT (INTVAL (arg0) * INTVAL (arg1));
7992
7993         case USE:
7994           /* invar * invar is a giv, but attempt to simplify it somehow.  */
7995           if (GET_CODE (arg1) != CONST_INT)
7996             return NULL_RTX;
7997
7998           arg0 = XEXP (arg0, 0);
7999           if (GET_CODE (arg0) == MULT)
8000             {
8001               /* (invar_0 * invar_1) * invar_2.  Associate.  */
8002               return simplify_giv_expr (loop,
8003                                         gen_rtx_MULT (mode,
8004                                                       XEXP (arg0, 0),
8005                                                       gen_rtx_MULT (mode,
8006                                                                     XEXP (arg0,
8007                                                                           1),
8008                                                                     arg1)),
8009                                         ext_val, benefit);
8010             }
8011           /* Propagate the MULT expressions to the innermost nodes.  */
8012           else if (GET_CODE (arg0) == PLUS)
8013             {
8014               /* (invar_0 + invar_1) * invar_2.  Distribute.  */
8015               return simplify_giv_expr (loop,
8016                                         gen_rtx_PLUS (mode,
8017                                                       gen_rtx_MULT (mode,
8018                                                                     XEXP (arg0,
8019                                                                           0),
8020                                                                     arg1),
8021                                                       gen_rtx_MULT (mode,
8022                                                                     XEXP (arg0,
8023                                                                           1),
8024                                                                     arg1)),
8025                                         ext_val, benefit);
8026             }
8027           return gen_rtx_USE (mode, gen_rtx_MULT (mode, arg0, arg1));
8028
8029         case MULT:
8030           /* (a * invar_1) * invar_2.  Associate.  */
8031           return simplify_giv_expr (loop,
8032                                     gen_rtx_MULT (mode,
8033                                                   XEXP (arg0, 0),
8034                                                   gen_rtx_MULT (mode,
8035                                                                 XEXP (arg0, 1),
8036                                                                 arg1)),
8037                                     ext_val, benefit);
8038
8039         case PLUS:
8040           /* (a + invar_1) * invar_2.  Distribute.  */
8041           return simplify_giv_expr (loop,
8042                                     gen_rtx_PLUS (mode,
8043                                                   gen_rtx_MULT (mode,
8044                                                                 XEXP (arg0, 0),
8045                                                                 arg1),
8046                                                   gen_rtx_MULT (mode,
8047                                                                 XEXP (arg0, 1),
8048                                                                 arg1)),
8049                                     ext_val, benefit);
8050
8051         default:
8052           gcc_unreachable ();
8053         }
8054
8055     case ASHIFT:
8056       /* Shift by constant is multiply by power of two.  */
8057       if (GET_CODE (XEXP (x, 1)) != CONST_INT)
8058         return 0;
8059
8060       return
8061         simplify_giv_expr (loop,
8062                            gen_rtx_MULT (mode,
8063                                          XEXP (x, 0),
8064                                          GEN_INT ((HOST_WIDE_INT) 1
8065                                                   << INTVAL (XEXP (x, 1)))),
8066                            ext_val, benefit);
8067
8068     case NEG:
8069       /* "-a" is "a * (-1)" */
8070       return simplify_giv_expr (loop,
8071                                 gen_rtx_MULT (mode, XEXP (x, 0), constm1_rtx),
8072                                 ext_val, benefit);
8073
8074     case NOT:
8075       /* "~a" is "-a - 1". Silly, but easy.  */
8076       return simplify_giv_expr (loop,
8077                                 gen_rtx_MINUS (mode,
8078                                                gen_rtx_NEG (mode, XEXP (x, 0)),
8079                                                const1_rtx),
8080                                 ext_val, benefit);
8081
8082     case USE:
8083       /* Already in proper form for invariant.  */
8084       return x;
8085
8086     case SIGN_EXTEND:
8087     case ZERO_EXTEND:
8088     case TRUNCATE:
8089       /* Conditionally recognize extensions of simple IVs.  After we've
8090          computed loop traversal counts and verified the range of the
8091          source IV, we'll reevaluate this as a GIV.  */
8092       if (*ext_val == NULL_RTX)
8093         {
8094           arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
8095           if (arg0 && *ext_val == NULL_RTX && REG_P (arg0))
8096             {
8097               *ext_val = gen_rtx_fmt_e (GET_CODE (x), mode, arg0);
8098               return arg0;
8099             }
8100         }
8101       goto do_default;
8102
8103     case REG:
8104       /* If this is a new register, we can't deal with it.  */
8105       if (REGNO (x) >= max_reg_before_loop)
8106         return 0;
8107
8108       /* Check for biv or giv.  */
8109       switch (REG_IV_TYPE (ivs, REGNO (x)))
8110         {
8111         case BASIC_INDUCT:
8112           return x;
8113         case GENERAL_INDUCT:
8114           {
8115             struct induction *v = REG_IV_INFO (ivs, REGNO (x));
8116
8117             /* Form expression from giv and add benefit.  Ensure this giv
8118                can derive another and subtract any needed adjustment if so.  */
8119
8120             /* Increasing the benefit here is risky.  The only case in which it
8121                is arguably correct is if this is the only use of V.  In other
8122                cases, this will artificially inflate the benefit of the current
8123                giv, and lead to suboptimal code.  Thus, it is disabled, since
8124                potentially not reducing an only marginally beneficial giv is
8125                less harmful than reducing many givs that are not really
8126                beneficial.  */
8127             {
8128               rtx single_use = regs->array[REGNO (x)].single_usage;
8129               if (single_use && single_use != const0_rtx)
8130                 *benefit += v->benefit;
8131             }
8132
8133             if (v->cant_derive)
8134               return 0;
8135
8136             tem = gen_rtx_PLUS (mode, gen_rtx_MULT (mode,
8137                                                     v->src_reg, v->mult_val),
8138                                 v->add_val);
8139
8140             if (v->derive_adjustment)
8141               tem = gen_rtx_MINUS (mode, tem, v->derive_adjustment);
8142             arg0 = simplify_giv_expr (loop, tem, ext_val, benefit);
8143             if (*ext_val)
8144               {
8145                 if (!v->ext_dependent)
8146                   return arg0;
8147               }
8148             else
8149               {
8150                 *ext_val = v->ext_dependent;
8151                 return arg0;
8152               }
8153             return 0;
8154           }
8155
8156         default:
8157         do_default:
8158           /* If it isn't an induction variable, and it is invariant, we
8159              may be able to simplify things further by looking through
8160              the bits we just moved outside the loop.  */
8161           if (loop_invariant_p (loop, x) == 1)
8162             {
8163               struct movable *m;
8164               struct loop_movables *movables = LOOP_MOVABLES (loop);
8165
8166               for (m = movables->head; m; m = m->next)
8167                 if (rtx_equal_p (x, m->set_dest))
8168                   {
8169                     /* Ok, we found a match.  Substitute and simplify.  */
8170
8171                     /* If we match another movable, we must use that, as
8172                        this one is going away.  */
8173                     if (m->match)
8174                       return simplify_giv_expr (loop, m->match->set_dest,
8175                                                 ext_val, benefit);
8176
8177                     /* If consec is nonzero, this is a member of a group of
8178                        instructions that were moved together.  We handle this
8179                        case only to the point of seeking to the last insn and
8180                        looking for a REG_EQUAL.  Fail if we don't find one.  */
8181                     if (m->consec != 0)
8182                       {
8183                         int i = m->consec;
8184                         tem = m->insn;
8185                         do
8186                           {
8187                             tem = NEXT_INSN (tem);
8188                           }
8189                         while (--i > 0);
8190
8191                         tem = find_reg_note (tem, REG_EQUAL, NULL_RTX);
8192                         if (tem)
8193                           tem = XEXP (tem, 0);
8194                       }
8195                     else
8196                       {
8197                         tem = single_set (m->insn);
8198                         if (tem)
8199                           tem = SET_SRC (tem);
8200                       }
8201
8202                     if (tem)
8203                       {
8204                         /* What we are most interested in is pointer
8205                            arithmetic on invariants -- only take
8206                            patterns we may be able to do something with.  */
8207                         if (GET_CODE (tem) == PLUS
8208                             || GET_CODE (tem) == MULT
8209                             || GET_CODE (tem) == ASHIFT
8210                             || GET_CODE (tem) == CONST_INT
8211                             || GET_CODE (tem) == SYMBOL_REF)
8212                           {
8213                             tem = simplify_giv_expr (loop, tem, ext_val,
8214                                                      benefit);
8215                             if (tem)
8216                               return tem;
8217                           }
8218                         else if (GET_CODE (tem) == CONST
8219                                  && GET_CODE (XEXP (tem, 0)) == PLUS
8220                                  && GET_CODE (XEXP (XEXP (tem, 0), 0)) == SYMBOL_REF
8221                                  && GET_CODE (XEXP (XEXP (tem, 0), 1)) == CONST_INT)
8222                           {
8223                             tem = simplify_giv_expr (loop, XEXP (tem, 0),
8224                                                      ext_val, benefit);
8225                             if (tem)
8226                               return tem;
8227                           }
8228                       }
8229                     break;
8230                   }
8231             }
8232           break;
8233         }
8234
8235       /* Fall through to general case.  */
8236     default:
8237       /* If invariant, return as USE (unless CONST_INT).
8238          Otherwise, not giv.  */
8239       if (GET_CODE (x) == USE)
8240         x = XEXP (x, 0);
8241
8242       if (loop_invariant_p (loop, x) == 1)
8243         {
8244           if (GET_CODE (x) == CONST_INT)
8245             return x;
8246           if (GET_CODE (x) == CONST
8247               && GET_CODE (XEXP (x, 0)) == PLUS
8248               && GET_CODE (XEXP (XEXP (x, 0), 0)) == SYMBOL_REF
8249               && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
8250             x = XEXP (x, 0);
8251           return gen_rtx_USE (mode, x);
8252         }
8253       else
8254         return 0;
8255     }
8256 }
8257
8258 /* This routine folds invariants such that there is only ever one
8259    CONST_INT in the summation.  It is only used by simplify_giv_expr.  */
8260
8261 static rtx
8262 sge_plus_constant (rtx x, rtx c)
8263 {
8264   if (GET_CODE (x) == CONST_INT)
8265     return GEN_INT (INTVAL (x) + INTVAL (c));
8266   else if (GET_CODE (x) != PLUS)
8267     return gen_rtx_PLUS (GET_MODE (x), x, c);
8268   else if (GET_CODE (XEXP (x, 1)) == CONST_INT)
8269     {
8270       return gen_rtx_PLUS (GET_MODE (x), XEXP (x, 0),
8271                            GEN_INT (INTVAL (XEXP (x, 1)) + INTVAL (c)));
8272     }
8273   else if (GET_CODE (XEXP (x, 0)) == PLUS
8274            || GET_CODE (XEXP (x, 1)) != PLUS)
8275     {
8276       return gen_rtx_PLUS (GET_MODE (x),
8277                            sge_plus_constant (XEXP (x, 0), c), XEXP (x, 1));
8278     }
8279   else
8280     {
8281       return gen_rtx_PLUS (GET_MODE (x),
8282                            sge_plus_constant (XEXP (x, 1), c), XEXP (x, 0));
8283     }
8284 }
8285
8286 static rtx
8287 sge_plus (enum machine_mode mode, rtx x, rtx y)
8288 {
8289   while (GET_CODE (y) == PLUS)
8290     {
8291       rtx a = XEXP (y, 0);
8292       if (GET_CODE (a) == CONST_INT)
8293         x = sge_plus_constant (x, a);
8294       else
8295         x = gen_rtx_PLUS (mode, x, a);
8296       y = XEXP (y, 1);
8297     }
8298   if (GET_CODE (y) == CONST_INT)
8299     x = sge_plus_constant (x, y);
8300   else
8301     x = gen_rtx_PLUS (mode, x, y);
8302   return x;
8303 }
8304 \f
8305 /* Help detect a giv that is calculated by several consecutive insns;
8306    for example,
8307       giv = biv * M
8308       giv = giv + A
8309    The caller has already identified the first insn P as having a giv as dest;
8310    we check that all other insns that set the same register follow
8311    immediately after P, that they alter nothing else,
8312    and that the result of the last is still a giv.
8313
8314    The value is 0 if the reg set in P is not really a giv.
8315    Otherwise, the value is the amount gained by eliminating
8316    all the consecutive insns that compute the value.
8317
8318    FIRST_BENEFIT is the amount gained by eliminating the first insn, P.
8319    SRC_REG is the reg of the biv; DEST_REG is the reg of the giv.
8320
8321    The coefficients of the ultimate giv value are stored in
8322    *MULT_VAL and *ADD_VAL.  */
8323
8324 static int
8325 consec_sets_giv (const struct loop *loop, int first_benefit, rtx p,
8326                  rtx src_reg, rtx dest_reg, rtx *add_val, rtx *mult_val,
8327                  rtx *ext_val, rtx *last_consec_insn)
8328 {
8329   struct loop_ivs *ivs = LOOP_IVS (loop);
8330   struct loop_regs *regs = LOOP_REGS (loop);
8331   int count;
8332   enum rtx_code code;
8333   int benefit;
8334   rtx temp;
8335   rtx set;
8336
8337   /* Indicate that this is a giv so that we can update the value produced in
8338      each insn of the multi-insn sequence.
8339
8340      This induction structure will be used only by the call to
8341      general_induction_var below, so we can allocate it on our stack.
8342      If this is a giv, our caller will replace the induct var entry with
8343      a new induction structure.  */
8344   struct induction *v;
8345
8346   if (REG_IV_TYPE (ivs, REGNO (dest_reg)) != UNKNOWN_INDUCT)
8347     return 0;
8348
8349   v = alloca (sizeof (struct induction));
8350   v->src_reg = src_reg;
8351   v->mult_val = *mult_val;
8352   v->add_val = *add_val;
8353   v->benefit = first_benefit;
8354   v->cant_derive = 0;
8355   v->derive_adjustment = 0;
8356   v->ext_dependent = NULL_RTX;
8357
8358   REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
8359   REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
8360
8361   count = regs->array[REGNO (dest_reg)].n_times_set - 1;
8362
8363   while (count > 0)
8364     {
8365       p = NEXT_INSN (p);
8366       code = GET_CODE (p);
8367
8368       /* If libcall, skip to end of call sequence.  */
8369       if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
8370         p = XEXP (temp, 0);
8371
8372       if (code == INSN
8373           && (set = single_set (p))
8374           && REG_P (SET_DEST (set))
8375           && SET_DEST (set) == dest_reg
8376           && (general_induction_var (loop, SET_SRC (set), &src_reg,
8377                                      add_val, mult_val, ext_val, 0,
8378                                      &benefit, VOIDmode)
8379               /* Giv created by equivalent expression.  */
8380               || ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX))
8381                   && general_induction_var (loop, XEXP (temp, 0), &src_reg,
8382                                             add_val, mult_val, ext_val, 0,
8383                                             &benefit, VOIDmode)))
8384           && src_reg == v->src_reg)
8385         {
8386           if (find_reg_note (p, REG_RETVAL, NULL_RTX))
8387             benefit += libcall_benefit (p);
8388
8389           count--;
8390           v->mult_val = *mult_val;
8391           v->add_val = *add_val;
8392           v->benefit += benefit;
8393         }
8394       else if (code != NOTE)
8395         {
8396           /* Allow insns that set something other than this giv to a
8397              constant.  Such insns are needed on machines which cannot
8398              include long constants and should not disqualify a giv.  */
8399           if (code == INSN
8400               && (set = single_set (p))
8401               && SET_DEST (set) != dest_reg
8402               && CONSTANT_P (SET_SRC (set)))
8403             continue;
8404
8405           REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
8406           return 0;
8407         }
8408     }
8409
8410   REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
8411   *last_consec_insn = p;
8412   return v->benefit;
8413 }
8414 \f
8415 /* Return an rtx, if any, that expresses giv G2 as a function of the register
8416    represented by G1.  If no such expression can be found, or it is clear that
8417    it cannot possibly be a valid address, 0 is returned.
8418
8419    To perform the computation, we note that
8420         G1 = x * v + a          and
8421         G2 = y * v + b
8422    where `v' is the biv.
8423
8424    So G2 = (y/b) * G1 + (b - a*y/x).
8425
8426    Note that MULT = y/x.
8427
8428    Update: A and B are now allowed to be additive expressions such that
8429    B contains all variables in A.  That is, computing B-A will not require
8430    subtracting variables.  */
8431
8432 static rtx
8433 express_from_1 (rtx a, rtx b, rtx mult)
8434 {
8435   /* If MULT is zero, then A*MULT is zero, and our expression is B.  */
8436
8437   if (mult == const0_rtx)
8438     return b;
8439
8440   /* If MULT is not 1, we cannot handle A with non-constants, since we
8441      would then be required to subtract multiples of the registers in A.
8442      This is theoretically possible, and may even apply to some Fortran
8443      constructs, but it is a lot of work and we do not attempt it here.  */
8444
8445   if (mult != const1_rtx && GET_CODE (a) != CONST_INT)
8446     return NULL_RTX;
8447
8448   /* In general these structures are sorted top to bottom (down the PLUS
8449      chain), but not left to right across the PLUS.  If B is a higher
8450      order giv than A, we can strip one level and recurse.  If A is higher
8451      order, we'll eventually bail out, but won't know that until the end.
8452      If they are the same, we'll strip one level around this loop.  */
8453
8454   while (GET_CODE (a) == PLUS && GET_CODE (b) == PLUS)
8455     {
8456       rtx ra, rb, oa, ob, tmp;
8457
8458       ra = XEXP (a, 0), oa = XEXP (a, 1);
8459       if (GET_CODE (ra) == PLUS)
8460         tmp = ra, ra = oa, oa = tmp;
8461
8462       rb = XEXP (b, 0), ob = XEXP (b, 1);
8463       if (GET_CODE (rb) == PLUS)
8464         tmp = rb, rb = ob, ob = tmp;
8465
8466       if (rtx_equal_p (ra, rb))
8467         /* We matched: remove one reg completely.  */
8468         a = oa, b = ob;
8469       else if (GET_CODE (ob) != PLUS && rtx_equal_p (ra, ob))
8470         /* An alternate match.  */
8471         a = oa, b = rb;
8472       else if (GET_CODE (oa) != PLUS && rtx_equal_p (oa, rb))
8473         /* An alternate match.  */
8474         a = ra, b = ob;
8475       else
8476         {
8477           /* Indicates an extra register in B.  Strip one level from B and
8478              recurse, hoping B was the higher order expression.  */
8479           ob = express_from_1 (a, ob, mult);
8480           if (ob == NULL_RTX)
8481             return NULL_RTX;
8482           return gen_rtx_PLUS (GET_MODE (b), rb, ob);
8483         }
8484     }
8485
8486   /* Here we are at the last level of A, go through the cases hoping to
8487      get rid of everything but a constant.  */
8488
8489   if (GET_CODE (a) == PLUS)
8490     {
8491       rtx ra, oa;
8492
8493       ra = XEXP (a, 0), oa = XEXP (a, 1);
8494       if (rtx_equal_p (oa, b))
8495         oa = ra;
8496       else if (!rtx_equal_p (ra, b))
8497         return NULL_RTX;
8498
8499       if (GET_CODE (oa) != CONST_INT)
8500         return NULL_RTX;
8501
8502       return GEN_INT (-INTVAL (oa) * INTVAL (mult));
8503     }
8504   else if (GET_CODE (a) == CONST_INT)
8505     {
8506       return plus_constant (b, -INTVAL (a) * INTVAL (mult));
8507     }
8508   else if (CONSTANT_P (a))
8509     {
8510       enum machine_mode mode_a = GET_MODE (a);
8511       enum machine_mode mode_b = GET_MODE (b);
8512       enum machine_mode mode = mode_b == VOIDmode ? mode_a : mode_b;
8513       return simplify_gen_binary (MINUS, mode, b, a);
8514     }
8515   else if (GET_CODE (b) == PLUS)
8516     {
8517       if (rtx_equal_p (a, XEXP (b, 0)))
8518         return XEXP (b, 1);
8519       else if (rtx_equal_p (a, XEXP (b, 1)))
8520         return XEXP (b, 0);
8521       else
8522         return NULL_RTX;
8523     }
8524   else if (rtx_equal_p (a, b))
8525     return const0_rtx;
8526
8527   return NULL_RTX;
8528 }
8529
8530 static rtx
8531 express_from (struct induction *g1, struct induction *g2)
8532 {
8533   rtx mult, add;
8534
8535   /* The value that G1 will be multiplied by must be a constant integer.  Also,
8536      the only chance we have of getting a valid address is if b*c/a (see above
8537      for notation) is also an integer.  */
8538   if (GET_CODE (g1->mult_val) == CONST_INT
8539       && GET_CODE (g2->mult_val) == CONST_INT)
8540     {
8541       if (g1->mult_val == const0_rtx
8542           || (g1->mult_val == constm1_rtx
8543               && INTVAL (g2->mult_val)
8544                  == (HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT - 1))
8545           || INTVAL (g2->mult_val) % INTVAL (g1->mult_val) != 0)
8546         return NULL_RTX;
8547       mult = GEN_INT (INTVAL (g2->mult_val) / INTVAL (g1->mult_val));
8548     }
8549   else if (rtx_equal_p (g1->mult_val, g2->mult_val))
8550     mult = const1_rtx;
8551   else
8552     {
8553       /* ??? Find out if the one is a multiple of the other?  */
8554       return NULL_RTX;
8555     }
8556
8557   add = express_from_1 (g1->add_val, g2->add_val, mult);
8558   if (add == NULL_RTX)
8559     {
8560       /* Failed.  If we've got a multiplication factor between G1 and G2,
8561          scale G1's addend and try again.  */
8562       if (INTVAL (mult) > 1)
8563         {
8564           rtx g1_add_val = g1->add_val;
8565           if (GET_CODE (g1_add_val) == MULT
8566               && GET_CODE (XEXP (g1_add_val, 1)) == CONST_INT)
8567             {
8568               HOST_WIDE_INT m;
8569               m = INTVAL (mult) * INTVAL (XEXP (g1_add_val, 1));
8570               g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val),
8571                                          XEXP (g1_add_val, 0), GEN_INT (m));
8572             }
8573           else
8574             {
8575               g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val), g1_add_val,
8576                                          mult);
8577             }
8578
8579           add = express_from_1 (g1_add_val, g2->add_val, const1_rtx);
8580         }
8581     }
8582   if (add == NULL_RTX)
8583     return NULL_RTX;
8584
8585   /* Form simplified final result.  */
8586   if (mult == const0_rtx)
8587     return add;
8588   else if (mult == const1_rtx)
8589     mult = g1->dest_reg;
8590   else
8591     mult = gen_rtx_MULT (g2->mode, g1->dest_reg, mult);
8592
8593   if (add == const0_rtx)
8594     return mult;
8595   else
8596     {
8597       if (GET_CODE (add) == PLUS
8598           && CONSTANT_P (XEXP (add, 1)))
8599         {
8600           rtx tem = XEXP (add, 1);
8601           mult = gen_rtx_PLUS (g2->mode, mult, XEXP (add, 0));
8602           add = tem;
8603         }
8604
8605       return gen_rtx_PLUS (g2->mode, mult, add);
8606     }
8607 }
8608 \f
8609 /* Return an rtx, if any, that expresses giv G2 as a function of the register
8610    represented by G1.  This indicates that G2 should be combined with G1 and
8611    that G2 can use (either directly or via an address expression) a register
8612    used to represent G1.  */
8613
8614 static rtx
8615 combine_givs_p (struct induction *g1, struct induction *g2)
8616 {
8617   rtx comb, ret;
8618
8619   /* With the introduction of ext dependent givs, we must care for modes.
8620      G2 must not use a wider mode than G1.  */
8621   if (GET_MODE_SIZE (g1->mode) < GET_MODE_SIZE (g2->mode))
8622     return NULL_RTX;
8623
8624   ret = comb = express_from (g1, g2);
8625   if (comb == NULL_RTX)
8626     return NULL_RTX;
8627   if (g1->mode != g2->mode)
8628     ret = gen_lowpart (g2->mode, comb);
8629
8630   /* If these givs are identical, they can be combined.  We use the results
8631      of express_from because the addends are not in a canonical form, so
8632      rtx_equal_p is a weaker test.  */
8633   /* But don't combine a DEST_REG giv with a DEST_ADDR giv; we want the
8634      combination to be the other way round.  */
8635   if (comb == g1->dest_reg
8636       && (g1->giv_type == DEST_REG || g2->giv_type == DEST_ADDR))
8637     {
8638       return ret;
8639     }
8640
8641   /* If G2 can be expressed as a function of G1 and that function is valid
8642      as an address and no more expensive than using a register for G2,
8643      the expression of G2 in terms of G1 can be used.  */
8644   if (ret != NULL_RTX
8645       && g2->giv_type == DEST_ADDR
8646       && memory_address_p (GET_MODE (g2->mem), ret))
8647     return ret;
8648
8649   return NULL_RTX;
8650 }
8651 \f
8652 /* See if BL is monotonic and has a constant per-iteration increment.
8653    Return the increment if so, otherwise return 0.  */
8654
8655 static HOST_WIDE_INT
8656 get_monotonic_increment (struct iv_class *bl)
8657 {
8658   struct induction *v;
8659   rtx incr;
8660
8661   /* Get the total increment and check that it is constant.  */
8662   incr = biv_total_increment (bl);
8663   if (incr == 0 || GET_CODE (incr) != CONST_INT)
8664     return 0;
8665
8666   for (v = bl->biv; v != 0; v = v->next_iv)
8667     {
8668       if (GET_CODE (v->add_val) != CONST_INT)
8669         return 0;
8670
8671       if (INTVAL (v->add_val) < 0 && INTVAL (incr) >= 0)
8672         return 0;
8673
8674       if (INTVAL (v->add_val) > 0 && INTVAL (incr) <= 0)
8675         return 0;
8676     }
8677   return INTVAL (incr);
8678 }
8679
8680
8681 /* Subroutine of biv_fits_mode_p.  Return true if biv BL, when biased by
8682    BIAS, will never exceed the unsigned range of MODE.  LOOP is the loop
8683    to which the biv belongs and INCR is its per-iteration increment.  */
8684
8685 static bool
8686 biased_biv_fits_mode_p (const struct loop *loop, struct iv_class *bl,
8687                         HOST_WIDE_INT incr, enum machine_mode mode,
8688                         unsigned HOST_WIDE_INT bias)
8689 {
8690   unsigned HOST_WIDE_INT initial, maximum, span, delta;
8691
8692   /* We need to be able to manipulate MODE-size constants.  */
8693   if (HOST_BITS_PER_WIDE_INT < GET_MODE_BITSIZE (mode))
8694     return false;
8695
8696   /* The number of loop iterations must be constant.  */
8697   if (LOOP_INFO (loop)->n_iterations == 0)
8698     return false;
8699
8700   /* So must the biv's initial value.  */
8701   if (bl->initial_value == 0 || GET_CODE (bl->initial_value) != CONST_INT)
8702     return false;
8703
8704   initial = bias + INTVAL (bl->initial_value);
8705   maximum = GET_MODE_MASK (mode);
8706
8707   /* Make sure that the initial value is within range.  */
8708   if (initial > maximum)
8709     return false;
8710
8711   /* Set up DELTA and SPAN such that the number of iterations * DELTA
8712      (calculated to arbitrary precision) must be <= SPAN.  */
8713   if (incr < 0)
8714     {
8715       delta = -incr;
8716       span = initial;
8717     }
8718   else
8719     {
8720       delta = incr;
8721       /* Handle the special case in which MAXIMUM is the largest
8722          unsigned HOST_WIDE_INT and INITIAL is 0.  */
8723       if (maximum + 1 == initial)
8724         span = LOOP_INFO (loop)->n_iterations * delta;
8725       else
8726         span = maximum + 1 - initial;
8727     }
8728   return (span / LOOP_INFO (loop)->n_iterations >= delta);
8729 }
8730
8731
8732 /* Return true if biv BL will never exceed the bounds of MODE.  LOOP is
8733    the loop to which BL belongs and INCR is its per-iteration increment.
8734    UNSIGNEDP is true if the biv should be treated as unsigned.  */
8735
8736 static bool
8737 biv_fits_mode_p (const struct loop *loop, struct iv_class *bl,
8738                  HOST_WIDE_INT incr, enum machine_mode mode, bool unsignedp)
8739 {
8740   struct loop_info *loop_info;
8741   unsigned HOST_WIDE_INT bias;
8742
8743   /* A biv's value will always be limited to its natural mode.
8744      Larger modes will observe the same wrap-around.  */
8745   if (GET_MODE_SIZE (mode) > GET_MODE_SIZE (GET_MODE (bl->biv->src_reg)))
8746     mode = GET_MODE (bl->biv->src_reg);
8747
8748   loop_info = LOOP_INFO (loop);
8749
8750   bias = (unsignedp ? 0 : (GET_MODE_MASK (mode) >> 1) + 1);
8751   if (biased_biv_fits_mode_p (loop, bl, incr, mode, bias))
8752     return true;
8753
8754   if (mode == GET_MODE (bl->biv->src_reg)
8755       && bl->biv->src_reg == loop_info->iteration_var
8756       && loop_info->comparison_value
8757       && loop_invariant_p (loop, loop_info->comparison_value))
8758     {
8759       /* If the increment is +1, and the exit test is a <, the BIV
8760          cannot overflow.  (For <=, we have the problematic case that
8761          the comparison value might be the maximum value of the range.)  */
8762       if (incr == 1)
8763         {
8764           if (loop_info->comparison_code == LT)
8765             return true;
8766           if (loop_info->comparison_code == LTU && unsignedp)
8767             return true;
8768         }
8769
8770       /* Likewise for increment -1 and exit test >.  */
8771       if (incr == -1)
8772         {
8773           if (loop_info->comparison_code == GT)
8774             return true;
8775           if (loop_info->comparison_code == GTU && unsignedp)
8776             return true;
8777         }
8778     }
8779   return false;
8780 }
8781
8782
8783 /* Given that X is an extension or truncation of BL, return true
8784    if it is unaffected by overflow.  LOOP is the loop to which
8785    BL belongs and INCR is its per-iteration increment.  */
8786
8787 static bool
8788 extension_within_bounds_p (const struct loop *loop, struct iv_class *bl,
8789                            HOST_WIDE_INT incr, rtx x)
8790 {
8791   enum machine_mode mode;
8792   bool signedp, unsignedp;
8793
8794   switch (GET_CODE (x))
8795     {
8796     case SIGN_EXTEND:
8797     case ZERO_EXTEND:
8798       mode = GET_MODE (XEXP (x, 0));
8799       signedp = (GET_CODE (x) == SIGN_EXTEND);
8800       unsignedp = (GET_CODE (x) == ZERO_EXTEND);
8801       break;
8802
8803     case TRUNCATE:
8804       /* We don't know whether this value is being used as signed
8805          or unsigned, so check the conditions for both.  */
8806       mode = GET_MODE (x);
8807       signedp = unsignedp = true;
8808       break;
8809
8810     default:
8811       gcc_unreachable ();
8812     }
8813
8814   return ((!signedp || biv_fits_mode_p (loop, bl, incr, mode, false))
8815           && (!unsignedp || biv_fits_mode_p (loop, bl, incr, mode, true)));
8816 }
8817
8818
8819 /* Check each extension dependent giv in this class to see if its
8820    root biv is safe from wrapping in the interior mode, which would
8821    make the giv illegal.  */
8822
8823 static void
8824 check_ext_dependent_givs (const struct loop *loop, struct iv_class *bl)
8825 {
8826   struct induction *v;
8827   HOST_WIDE_INT incr;
8828
8829   incr = get_monotonic_increment (bl);
8830
8831   /* Invalidate givs that fail the tests.  */
8832   for (v = bl->giv; v; v = v->next_iv)
8833     if (v->ext_dependent)
8834       {
8835         if (incr != 0
8836             && extension_within_bounds_p (loop, bl, incr, v->ext_dependent))
8837           {
8838             if (loop_dump_stream)
8839               fprintf (loop_dump_stream,
8840                        "Verified ext dependent giv at %d of reg %d\n",
8841                        INSN_UID (v->insn), bl->regno);
8842           }
8843         else
8844           {
8845             if (loop_dump_stream)
8846               fprintf (loop_dump_stream,
8847                        "Failed ext dependent giv at %d\n",
8848                        INSN_UID (v->insn));
8849
8850             v->ignore = 1;
8851             bl->all_reduced = 0;
8852           }
8853       }
8854 }
8855
8856 /* Generate a version of VALUE in a mode appropriate for initializing V.  */
8857
8858 static rtx
8859 extend_value_for_giv (struct induction *v, rtx value)
8860 {
8861   rtx ext_dep = v->ext_dependent;
8862
8863   if (! ext_dep)
8864     return value;
8865
8866   /* Recall that check_ext_dependent_givs verified that the known bounds
8867      of a biv did not overflow or wrap with respect to the extension for
8868      the giv.  Therefore, constants need no additional adjustment.  */
8869   if (CONSTANT_P (value) && GET_MODE (value) == VOIDmode)
8870     return value;
8871
8872   /* Otherwise, we must adjust the value to compensate for the
8873      differing modes of the biv and the giv.  */
8874   return gen_rtx_fmt_e (GET_CODE (ext_dep), GET_MODE (ext_dep), value);
8875 }
8876 \f
8877 struct combine_givs_stats
8878 {
8879   int giv_number;
8880   int total_benefit;
8881 };
8882
8883 static int
8884 cmp_combine_givs_stats (const void *xp, const void *yp)
8885 {
8886   const struct combine_givs_stats * const x =
8887     (const struct combine_givs_stats *) xp;
8888   const struct combine_givs_stats * const y =
8889     (const struct combine_givs_stats *) yp;
8890   int d;
8891   d = y->total_benefit - x->total_benefit;
8892   /* Stabilize the sort.  */
8893   if (!d)
8894     d = x->giv_number - y->giv_number;
8895   return d;
8896 }
8897
8898 /* Check all pairs of givs for iv_class BL and see if any can be combined with
8899    any other.  If so, point SAME to the giv combined with and set NEW_REG to
8900    be an expression (in terms of the other giv's DEST_REG) equivalent to the
8901    giv.  Also, update BENEFIT and related fields for cost/benefit analysis.  */
8902
8903 static void
8904 combine_givs (struct loop_regs *regs, struct iv_class *bl)
8905 {
8906   /* Additional benefit to add for being combined multiple times.  */
8907   const int extra_benefit = 3;
8908
8909   struct induction *g1, *g2, **giv_array;
8910   int i, j, k, giv_count;
8911   struct combine_givs_stats *stats;
8912   rtx *can_combine;
8913
8914   /* Count givs, because bl->giv_count is incorrect here.  */
8915   giv_count = 0;
8916   for (g1 = bl->giv; g1; g1 = g1->next_iv)
8917     if (!g1->ignore)
8918       giv_count++;
8919
8920   giv_array = alloca (giv_count * sizeof (struct induction *));
8921   i = 0;
8922   for (g1 = bl->giv; g1; g1 = g1->next_iv)
8923     if (!g1->ignore)
8924       giv_array[i++] = g1;
8925
8926   stats = xcalloc (giv_count, sizeof (*stats));
8927   can_combine = xcalloc (giv_count, giv_count * sizeof (rtx));
8928
8929   for (i = 0; i < giv_count; i++)
8930     {
8931       int this_benefit;
8932       rtx single_use;
8933
8934       g1 = giv_array[i];
8935       stats[i].giv_number = i;
8936
8937       /* If a DEST_REG GIV is used only once, do not allow it to combine
8938          with anything, for in doing so we will gain nothing that cannot
8939          be had by simply letting the GIV with which we would have combined
8940          to be reduced on its own.  The lossage shows up in particular with
8941          DEST_ADDR targets on hosts with reg+reg addressing, though it can
8942          be seen elsewhere as well.  */
8943       if (g1->giv_type == DEST_REG
8944           && (single_use = regs->array[REGNO (g1->dest_reg)].single_usage)
8945           && single_use != const0_rtx)
8946         continue;
8947
8948       this_benefit = g1->benefit;
8949       /* Add an additional weight for zero addends.  */
8950       if (g1->no_const_addval)
8951         this_benefit += 1;
8952
8953       for (j = 0; j < giv_count; j++)
8954         {
8955           rtx this_combine;
8956
8957           g2 = giv_array[j];
8958           if (g1 != g2
8959               && (this_combine = combine_givs_p (g1, g2)) != NULL_RTX)
8960             {
8961               can_combine[i * giv_count + j] = this_combine;
8962               this_benefit += g2->benefit + extra_benefit;
8963             }
8964         }
8965       stats[i].total_benefit = this_benefit;
8966     }
8967
8968   /* Iterate, combining until we can't.  */
8969 restart:
8970   qsort (stats, giv_count, sizeof (*stats), cmp_combine_givs_stats);
8971
8972   if (loop_dump_stream)
8973     {
8974       fprintf (loop_dump_stream, "Sorted combine statistics:\n");
8975       for (k = 0; k < giv_count; k++)
8976         {
8977           g1 = giv_array[stats[k].giv_number];
8978           if (!g1->combined_with && !g1->same)
8979             fprintf (loop_dump_stream, " {%d, %d}",
8980                      INSN_UID (giv_array[stats[k].giv_number]->insn),
8981                      stats[k].total_benefit);
8982         }
8983       putc ('\n', loop_dump_stream);
8984     }
8985
8986   for (k = 0; k < giv_count; k++)
8987     {
8988       int g1_add_benefit = 0;
8989
8990       i = stats[k].giv_number;
8991       g1 = giv_array[i];
8992
8993       /* If it has already been combined, skip.  */
8994       if (g1->combined_with || g1->same)
8995         continue;
8996
8997       for (j = 0; j < giv_count; j++)
8998         {
8999           g2 = giv_array[j];
9000           if (g1 != g2 && can_combine[i * giv_count + j]
9001               /* If it has already been combined, skip.  */
9002               && ! g2->same && ! g2->combined_with)
9003             {
9004               int l;
9005
9006               g2->new_reg = can_combine[i * giv_count + j];
9007               g2->same = g1;
9008               /* For destination, we now may replace by mem expression instead
9009                  of register.  This changes the costs considerably, so add the
9010                  compensation.  */
9011               if (g2->giv_type == DEST_ADDR)
9012                 g2->benefit = (g2->benefit + reg_address_cost
9013                                - address_cost (g2->new_reg,
9014                                GET_MODE (g2->mem)));
9015               g1->combined_with++;
9016               g1->lifetime += g2->lifetime;
9017
9018               g1_add_benefit += g2->benefit;
9019
9020               /* ??? The new final_[bg]iv_value code does a much better job
9021                  of finding replaceable giv's, and hence this code may no
9022                  longer be necessary.  */
9023               if (! g2->replaceable && REG_USERVAR_P (g2->dest_reg))
9024                 g1_add_benefit -= copy_cost;
9025
9026               /* To help optimize the next set of combinations, remove
9027                  this giv from the benefits of other potential mates.  */
9028               for (l = 0; l < giv_count; ++l)
9029                 {
9030                   int m = stats[l].giv_number;
9031                   if (can_combine[m * giv_count + j])
9032                     stats[l].total_benefit -= g2->benefit + extra_benefit;
9033                 }
9034
9035               if (loop_dump_stream)
9036                 fprintf (loop_dump_stream,
9037                          "giv at %d combined with giv at %d; new benefit %d + %d, lifetime %d\n",
9038                          INSN_UID (g2->insn), INSN_UID (g1->insn),
9039                          g1->benefit, g1_add_benefit, g1->lifetime);
9040             }
9041         }
9042
9043       /* To help optimize the next set of combinations, remove
9044          this giv from the benefits of other potential mates.  */
9045       if (g1->combined_with)
9046         {
9047           for (j = 0; j < giv_count; ++j)
9048             {
9049               int m = stats[j].giv_number;
9050               if (can_combine[m * giv_count + i])
9051                 stats[j].total_benefit -= g1->benefit + extra_benefit;
9052             }
9053
9054           g1->benefit += g1_add_benefit;
9055
9056           /* We've finished with this giv, and everything it touched.
9057              Restart the combination so that proper weights for the
9058              rest of the givs are properly taken into account.  */
9059           /* ??? Ideally we would compact the arrays at this point, so
9060              as to not cover old ground.  But sanely compacting
9061              can_combine is tricky.  */
9062           goto restart;
9063         }
9064     }
9065
9066   /* Clean up.  */
9067   free (stats);
9068   free (can_combine);
9069 }
9070 \f
9071 /* Generate sequence for REG = B * M + A.  B is the initial value of
9072    the basic induction variable, M a multiplicative constant, A an
9073    additive constant and REG the destination register.  */
9074
9075 static rtx
9076 gen_add_mult (rtx b,  rtx m, rtx a, rtx reg)
9077 {
9078   rtx seq;
9079   rtx result;
9080
9081   start_sequence ();
9082   /* Use unsigned arithmetic.  */
9083   result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
9084   if (reg != result)
9085     emit_move_insn (reg, result);
9086   seq = get_insns ();
9087   end_sequence ();
9088
9089   return seq;
9090 }
9091
9092
9093 /* Update registers created in insn sequence SEQ.  */
9094
9095 static void
9096 loop_regs_update (const struct loop *loop ATTRIBUTE_UNUSED, rtx seq)
9097 {
9098   rtx insn;
9099
9100   /* Update register info for alias analysis.  */
9101
9102   insn = seq;
9103   while (insn != NULL_RTX)
9104     {
9105       rtx set = single_set (insn);
9106
9107       if (set && REG_P (SET_DEST (set)))
9108         record_base_value (REGNO (SET_DEST (set)), SET_SRC (set), 0);
9109
9110       insn = NEXT_INSN (insn);
9111     }
9112 }
9113
9114
9115 /* EMIT code before BEFORE_BB/BEFORE_INSN to set REG = B * M + A.  B
9116    is the initial value of the basic induction variable, M a
9117    multiplicative constant, A an additive constant and REG the
9118    destination register.  */
9119
9120 static void
9121 loop_iv_add_mult_emit_before (const struct loop *loop, rtx b, rtx m, rtx a,
9122                               rtx reg, basic_block before_bb, rtx before_insn)
9123 {
9124   rtx seq;
9125
9126   if (! before_insn)
9127     {
9128       loop_iv_add_mult_hoist (loop, b, m, a, reg);
9129       return;
9130     }
9131
9132   /* Use copy_rtx to prevent unexpected sharing of these rtx.  */
9133   seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
9134
9135   /* Increase the lifetime of any invariants moved further in code.  */
9136   update_reg_last_use (a, before_insn);
9137   update_reg_last_use (b, before_insn);
9138   update_reg_last_use (m, before_insn);
9139
9140   /* It is possible that the expansion created lots of new registers.
9141      Iterate over the sequence we just created and record them all.  We
9142      must do this before inserting the sequence.  */
9143   loop_regs_update (loop, seq);
9144
9145   loop_insn_emit_before (loop, before_bb, before_insn, seq);
9146 }
9147
9148
9149 /* Emit insns in loop pre-header to set REG = B * M + A.  B is the
9150    initial value of the basic induction variable, M a multiplicative
9151    constant, A an additive constant and REG the destination
9152    register.  */
9153
9154 static void
9155 loop_iv_add_mult_sink (const struct loop *loop, rtx b, rtx m, rtx a, rtx reg)
9156 {
9157   rtx seq;
9158
9159   /* Use copy_rtx to prevent unexpected sharing of these rtx.  */
9160   seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
9161
9162   /* Increase the lifetime of any invariants moved further in code.
9163      ???? Is this really necessary?  */
9164   update_reg_last_use (a, loop->sink);
9165   update_reg_last_use (b, loop->sink);
9166   update_reg_last_use (m, loop->sink);
9167
9168   /* It is possible that the expansion created lots of new registers.
9169      Iterate over the sequence we just created and record them all.  We
9170      must do this before inserting the sequence.  */
9171   loop_regs_update (loop, seq);
9172
9173   loop_insn_sink (loop, seq);
9174 }
9175
9176
9177 /* Emit insns after loop to set REG = B * M + A.  B is the initial
9178    value of the basic induction variable, M a multiplicative constant,
9179    A an additive constant and REG the destination register.  */
9180
9181 static void
9182 loop_iv_add_mult_hoist (const struct loop *loop, rtx b, rtx m, rtx a, rtx reg)
9183 {
9184   rtx seq;
9185
9186   /* Use copy_rtx to prevent unexpected sharing of these rtx.  */
9187   seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
9188
9189   /* It is possible that the expansion created lots of new registers.
9190      Iterate over the sequence we just created and record them all.  We
9191      must do this before inserting the sequence.  */
9192   loop_regs_update (loop, seq);
9193
9194   loop_insn_hoist (loop, seq);
9195 }
9196
9197
9198
9199 /* Similar to gen_add_mult, but compute cost rather than generating
9200    sequence.  */
9201
9202 static int
9203 iv_add_mult_cost (rtx b, rtx m, rtx a, rtx reg)
9204 {
9205   int cost = 0;
9206   rtx last, result;
9207
9208   start_sequence ();
9209   result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
9210   if (reg != result)
9211     emit_move_insn (reg, result);
9212   last = get_last_insn ();
9213   while (last)
9214     {
9215       rtx t = single_set (last);
9216       if (t)
9217         cost += rtx_cost (SET_SRC (t), SET);
9218       last = PREV_INSN (last);
9219     }
9220   end_sequence ();
9221   return cost;
9222 }
9223 \f
9224 /* Test whether A * B can be computed without
9225    an actual multiply insn.  Value is 1 if so.
9226
9227   ??? This function stinks because it generates a ton of wasted RTL
9228   ??? and as a result fragments GC memory to no end.  There are other
9229   ??? places in the compiler which are invoked a lot and do the same
9230   ??? thing, generate wasted RTL just to see if something is possible.  */
9231
9232 static int
9233 product_cheap_p (rtx a, rtx b)
9234 {
9235   rtx tmp;
9236   int win, n_insns;
9237
9238   /* If only one is constant, make it B.  */
9239   if (GET_CODE (a) == CONST_INT)
9240     tmp = a, a = b, b = tmp;
9241
9242   /* If first constant, both constant, so don't need multiply.  */
9243   if (GET_CODE (a) == CONST_INT)
9244     return 1;
9245
9246   /* If second not constant, neither is constant, so would need multiply.  */
9247   if (GET_CODE (b) != CONST_INT)
9248     return 0;
9249
9250   /* One operand is constant, so might not need multiply insn.  Generate the
9251      code for the multiply and see if a call or multiply, or long sequence
9252      of insns is generated.  */
9253
9254   start_sequence ();
9255   expand_mult (GET_MODE (a), a, b, NULL_RTX, 1);
9256   tmp = get_insns ();
9257   end_sequence ();
9258
9259   win = 1;
9260   if (tmp == NULL_RTX)
9261     ;
9262   else if (INSN_P (tmp))
9263     {
9264       n_insns = 0;
9265       while (tmp != NULL_RTX)
9266         {
9267           rtx next = NEXT_INSN (tmp);
9268
9269           if (++n_insns > 3
9270               || !NONJUMP_INSN_P (tmp)
9271               || (GET_CODE (PATTERN (tmp)) == SET
9272                   && GET_CODE (SET_SRC (PATTERN (tmp))) == MULT)
9273               || (GET_CODE (PATTERN (tmp)) == PARALLEL
9274                   && GET_CODE (XVECEXP (PATTERN (tmp), 0, 0)) == SET
9275                   && GET_CODE (SET_SRC (XVECEXP (PATTERN (tmp), 0, 0))) == MULT))
9276             {
9277               win = 0;
9278               break;
9279             }
9280
9281           tmp = next;
9282         }
9283     }
9284   else if (GET_CODE (tmp) == SET
9285            && GET_CODE (SET_SRC (tmp)) == MULT)
9286     win = 0;
9287   else if (GET_CODE (tmp) == PARALLEL
9288            && GET_CODE (XVECEXP (tmp, 0, 0)) == SET
9289            && GET_CODE (SET_SRC (XVECEXP (tmp, 0, 0))) == MULT)
9290     win = 0;
9291
9292   return win;
9293 }
9294 \f
9295 /* Check to see if loop can be terminated by a "decrement and branch until
9296    zero" instruction.  If so, add a REG_NONNEG note to the branch insn if so.
9297    Also try reversing an increment loop to a decrement loop
9298    to see if the optimization can be performed.
9299    Value is nonzero if optimization was performed.  */
9300
9301 /* This is useful even if the architecture doesn't have such an insn,
9302    because it might change a loops which increments from 0 to n to a loop
9303    which decrements from n to 0.  A loop that decrements to zero is usually
9304    faster than one that increments from zero.  */
9305
9306 /* ??? This could be rewritten to use some of the loop unrolling procedures,
9307    such as approx_final_value, biv_total_increment, loop_iterations, and
9308    final_[bg]iv_value.  */
9309
9310 static int
9311 check_dbra_loop (struct loop *loop, int insn_count)
9312 {
9313   struct loop_info *loop_info = LOOP_INFO (loop);
9314   struct loop_regs *regs = LOOP_REGS (loop);
9315   struct loop_ivs *ivs = LOOP_IVS (loop);
9316   struct iv_class *bl;
9317   rtx reg;
9318   enum machine_mode mode;
9319   rtx jump_label;
9320   rtx final_value;
9321   rtx start_value;
9322   rtx new_add_val;
9323   rtx comparison;
9324   rtx before_comparison;
9325   rtx p;
9326   rtx jump;
9327   rtx first_compare;
9328   int compare_and_branch;
9329   rtx loop_start = loop->start;
9330   rtx loop_end = loop->end;
9331
9332   /* If last insn is a conditional branch, and the insn before tests a
9333      register value, try to optimize it.  Otherwise, we can't do anything.  */
9334
9335   jump = PREV_INSN (loop_end);
9336   comparison = get_condition_for_loop (loop, jump);
9337   if (comparison == 0)
9338     return 0;
9339   if (!onlyjump_p (jump))
9340     return 0;
9341
9342   /* Try to compute whether the compare/branch at the loop end is one or
9343      two instructions.  */
9344   get_condition (jump, &first_compare, false, true);
9345   if (first_compare == jump)
9346     compare_and_branch = 1;
9347   else if (first_compare == prev_nonnote_insn (jump))
9348     compare_and_branch = 2;
9349   else
9350     return 0;
9351
9352   {
9353     /* If more than one condition is present to control the loop, then
9354        do not proceed, as this function does not know how to rewrite
9355        loop tests with more than one condition.
9356
9357        Look backwards from the first insn in the last comparison
9358        sequence and see if we've got another comparison sequence.  */
9359
9360     rtx jump1;
9361     if ((jump1 = prev_nonnote_insn (first_compare))
9362         && JUMP_P (jump1))
9363         return 0;
9364   }
9365
9366   /* Check all of the bivs to see if the compare uses one of them.
9367      Skip biv's set more than once because we can't guarantee that
9368      it will be zero on the last iteration.  Also skip if the biv is
9369      used between its update and the test insn.  */
9370
9371   for (bl = ivs->list; bl; bl = bl->next)
9372     {
9373       if (bl->biv_count == 1
9374           && ! bl->biv->maybe_multiple
9375           && bl->biv->dest_reg == XEXP (comparison, 0)
9376           && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
9377                                    first_compare))
9378         break;
9379     }
9380
9381   /* Try swapping the comparison to identify a suitable biv.  */
9382   if (!bl)
9383     for (bl = ivs->list; bl; bl = bl->next)
9384       if (bl->biv_count == 1
9385           && ! bl->biv->maybe_multiple
9386           && bl->biv->dest_reg == XEXP (comparison, 1)
9387           && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
9388                                    first_compare))
9389         {
9390           comparison = gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)),
9391                                        VOIDmode,
9392                                        XEXP (comparison, 1),
9393                                        XEXP (comparison, 0));
9394           break;
9395         }
9396
9397   if (! bl)
9398     return 0;
9399
9400   /* Look for the case where the basic induction variable is always
9401      nonnegative, and equals zero on the last iteration.
9402      In this case, add a reg_note REG_NONNEG, which allows the
9403      m68k DBRA instruction to be used.  */
9404
9405   if (((GET_CODE (comparison) == GT && XEXP (comparison, 1) == constm1_rtx)
9406        || (GET_CODE (comparison) == NE && XEXP (comparison, 1) == const0_rtx))
9407       && GET_CODE (bl->biv->add_val) == CONST_INT
9408       && INTVAL (bl->biv->add_val) < 0)
9409     {
9410       /* Initial value must be greater than 0,
9411          init_val % -dec_value == 0 to ensure that it equals zero on
9412          the last iteration */
9413
9414       if (GET_CODE (bl->initial_value) == CONST_INT
9415           && INTVAL (bl->initial_value) > 0
9416           && (INTVAL (bl->initial_value)
9417               % (-INTVAL (bl->biv->add_val))) == 0)
9418         {
9419           /* Register always nonnegative, add REG_NOTE to branch.  */
9420           if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
9421             REG_NOTES (jump)
9422               = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
9423                                    REG_NOTES (jump));
9424           bl->nonneg = 1;
9425
9426           return 1;
9427         }
9428
9429       /* If the decrement is 1 and the value was tested as >= 0 before
9430          the loop, then we can safely optimize.  */
9431       for (p = loop_start; p; p = PREV_INSN (p))
9432         {
9433           if (LABEL_P (p))
9434             break;
9435           if (!JUMP_P (p))
9436             continue;
9437
9438           before_comparison = get_condition_for_loop (loop, p);
9439           if (before_comparison
9440               && XEXP (before_comparison, 0) == bl->biv->dest_reg
9441               && (GET_CODE (before_comparison) == LT
9442                   || GET_CODE (before_comparison) == LTU)
9443               && XEXP (before_comparison, 1) == const0_rtx
9444               && ! reg_set_between_p (bl->biv->dest_reg, p, loop_start)
9445               && INTVAL (bl->biv->add_val) == -1)
9446             {
9447               if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
9448                 REG_NOTES (jump)
9449                   = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
9450                                        REG_NOTES (jump));
9451               bl->nonneg = 1;
9452
9453               return 1;
9454             }
9455         }
9456     }
9457   else if (GET_CODE (bl->biv->add_val) == CONST_INT
9458            && INTVAL (bl->biv->add_val) > 0)
9459     {
9460       /* Try to change inc to dec, so can apply above optimization.  */
9461       /* Can do this if:
9462          all registers modified are induction variables or invariant,
9463          all memory references have non-overlapping addresses
9464          (obviously true if only one write)
9465          allow 2 insns for the compare/jump at the end of the loop.  */
9466       /* Also, we must avoid any instructions which use both the reversed
9467          biv and another biv.  Such instructions will fail if the loop is
9468          reversed.  We meet this condition by requiring that either
9469          no_use_except_counting is true, or else that there is only
9470          one biv.  */
9471       int num_nonfixed_reads = 0;
9472       /* 1 if the iteration var is used only to count iterations.  */
9473       int no_use_except_counting = 0;
9474       /* 1 if the loop has no memory store, or it has a single memory store
9475          which is reversible.  */
9476       int reversible_mem_store = 1;
9477
9478       if (bl->giv_count == 0
9479           && !loop->exit_count
9480           && !loop_info->has_multiple_exit_targets)
9481         {
9482           rtx bivreg = regno_reg_rtx[bl->regno];
9483           struct iv_class *blt;
9484
9485           /* If there are no givs for this biv, and the only exit is the
9486              fall through at the end of the loop, then
9487              see if perhaps there are no uses except to count.  */
9488           no_use_except_counting = 1;
9489           for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
9490             if (INSN_P (p))
9491               {
9492                 rtx set = single_set (p);
9493
9494                 if (set && REG_P (SET_DEST (set))
9495                     && REGNO (SET_DEST (set)) == bl->regno)
9496                   /* An insn that sets the biv is okay.  */
9497                   ;
9498                 else if (!reg_mentioned_p (bivreg, PATTERN (p)))
9499                   /* An insn that doesn't mention the biv is okay.  */
9500                   ;
9501                 else if (p == prev_nonnote_insn (prev_nonnote_insn (loop_end))
9502                          || p == prev_nonnote_insn (loop_end))
9503                   {
9504                     /* If either of these insns uses the biv and sets a pseudo
9505                        that has more than one usage, then the biv has uses
9506                        other than counting since it's used to derive a value
9507                        that is used more than one time.  */
9508                     note_stores (PATTERN (p), note_set_pseudo_multiple_uses,
9509                                  regs);
9510                     if (regs->multiple_uses)
9511                       {
9512                         no_use_except_counting = 0;
9513                         break;
9514                       }
9515                   }
9516                 else
9517                   {
9518                     no_use_except_counting = 0;
9519                     break;
9520                   }
9521               }
9522
9523           /* A biv has uses besides counting if it is used to set
9524              another biv.  */
9525           for (blt = ivs->list; blt; blt = blt->next)
9526             if (blt->init_set
9527                 && reg_mentioned_p (bivreg, SET_SRC (blt->init_set)))
9528               {
9529                 no_use_except_counting = 0;
9530                 break;
9531               }
9532         }
9533
9534       if (no_use_except_counting)
9535         /* No need to worry about MEMs.  */
9536         ;
9537       else if (loop_info->num_mem_sets <= 1)
9538         {
9539           for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
9540             if (INSN_P (p))
9541               num_nonfixed_reads += count_nonfixed_reads (loop, PATTERN (p));
9542
9543           /* If the loop has a single store, and the destination address is
9544              invariant, then we can't reverse the loop, because this address
9545              might then have the wrong value at loop exit.
9546              This would work if the source was invariant also, however, in that
9547              case, the insn should have been moved out of the loop.  */
9548
9549           if (loop_info->num_mem_sets == 1)
9550             {
9551               struct induction *v;
9552
9553               /* If we could prove that each of the memory locations
9554                  written to was different, then we could reverse the
9555                  store -- but we don't presently have any way of
9556                  knowing that.  */
9557               reversible_mem_store = 0;
9558
9559               /* If the store depends on a register that is set after the
9560                  store, it depends on the initial value, and is thus not
9561                  reversible.  */
9562               for (v = bl->giv; reversible_mem_store && v; v = v->next_iv)
9563                 {
9564                   if (v->giv_type == DEST_REG
9565                       && reg_mentioned_p (v->dest_reg,
9566                                           PATTERN (loop_info->first_loop_store_insn))
9567                       && loop_insn_first_p (loop_info->first_loop_store_insn,
9568                                             v->insn))
9569                     reversible_mem_store = 0;
9570                 }
9571             }
9572         }
9573       else
9574         return 0;
9575
9576       /* This code only acts for innermost loops.  Also it simplifies
9577          the memory address check by only reversing loops with
9578          zero or one memory access.
9579          Two memory accesses could involve parts of the same array,
9580          and that can't be reversed.
9581          If the biv is used only for counting, than we don't need to worry
9582          about all these things.  */
9583
9584       if ((num_nonfixed_reads <= 1
9585            && ! loop_info->has_nonconst_call
9586            && ! loop_info->has_prefetch
9587            && ! loop_info->has_volatile
9588            && reversible_mem_store
9589            && (bl->giv_count + bl->biv_count + loop_info->num_mem_sets
9590                + num_unmoved_movables (loop) + compare_and_branch == insn_count)
9591            && (bl == ivs->list && bl->next == 0))
9592           || (no_use_except_counting && ! loop_info->has_prefetch))
9593         {
9594           rtx tem;
9595
9596           /* Loop can be reversed.  */
9597           if (loop_dump_stream)
9598             fprintf (loop_dump_stream, "Can reverse loop\n");
9599
9600           /* Now check other conditions:
9601
9602              The increment must be a constant, as must the initial value,
9603              and the comparison code must be LT.
9604
9605              This test can probably be improved since +/- 1 in the constant
9606              can be obtained by changing LT to LE and vice versa; this is
9607              confusing.  */
9608
9609           if (comparison
9610               /* for constants, LE gets turned into LT */
9611               && (GET_CODE (comparison) == LT
9612                   || (GET_CODE (comparison) == LE
9613                       && no_use_except_counting)
9614                   || GET_CODE (comparison) == LTU))
9615             {
9616               HOST_WIDE_INT add_val, add_adjust, comparison_val = 0;
9617               rtx initial_value, comparison_value;
9618               int nonneg = 0;
9619               enum rtx_code cmp_code;
9620               int comparison_const_width;
9621               unsigned HOST_WIDE_INT comparison_sign_mask;
9622               bool keep_first_compare;
9623
9624               add_val = INTVAL (bl->biv->add_val);
9625               comparison_value = XEXP (comparison, 1);
9626               if (GET_MODE (comparison_value) == VOIDmode)
9627                 comparison_const_width
9628                   = GET_MODE_BITSIZE (GET_MODE (XEXP (comparison, 0)));
9629               else
9630                 comparison_const_width
9631                   = GET_MODE_BITSIZE (GET_MODE (comparison_value));
9632               if (comparison_const_width > HOST_BITS_PER_WIDE_INT)
9633                 comparison_const_width = HOST_BITS_PER_WIDE_INT;
9634               comparison_sign_mask
9635                 = (unsigned HOST_WIDE_INT) 1 << (comparison_const_width - 1);
9636
9637               /* If the comparison value is not a loop invariant, then we
9638                  can not reverse this loop.
9639
9640                  ??? If the insns which initialize the comparison value as
9641                  a whole compute an invariant result, then we could move
9642                  them out of the loop and proceed with loop reversal.  */
9643               if (! loop_invariant_p (loop, comparison_value))
9644                 return 0;
9645
9646               if (GET_CODE (comparison_value) == CONST_INT)
9647                 comparison_val = INTVAL (comparison_value);
9648               initial_value = bl->initial_value;
9649
9650               /* Normalize the initial value if it is an integer and
9651                  has no other use except as a counter.  This will allow
9652                  a few more loops to be reversed.  */
9653               if (no_use_except_counting
9654                   && GET_CODE (comparison_value) == CONST_INT
9655                   && GET_CODE (initial_value) == CONST_INT)
9656                 {
9657                   comparison_val = comparison_val - INTVAL (bl->initial_value);
9658                   /* The code below requires comparison_val to be a multiple
9659                      of add_val in order to do the loop reversal, so
9660                      round up comparison_val to a multiple of add_val.
9661                      Since comparison_value is constant, we know that the
9662                      current comparison code is LT.  */
9663                   comparison_val = comparison_val + add_val - 1;
9664                   comparison_val
9665                     -= (unsigned HOST_WIDE_INT) comparison_val % add_val;
9666                   /* We postpone overflow checks for COMPARISON_VAL here;
9667                      even if there is an overflow, we might still be able to
9668                      reverse the loop, if converting the loop exit test to
9669                      NE is possible.  */
9670                   initial_value = const0_rtx;
9671                 }
9672
9673               /* First check if we can do a vanilla loop reversal.  */
9674               if (initial_value == const0_rtx
9675                   && GET_CODE (comparison_value) == CONST_INT
9676                      /* Now do postponed overflow checks on COMPARISON_VAL.  */
9677                   && ! (((comparison_val - add_val) ^ INTVAL (comparison_value))
9678                         & comparison_sign_mask))
9679                 {
9680                   /* Register will always be nonnegative, with value
9681                      0 on last iteration */
9682                   add_adjust = add_val;
9683                   nonneg = 1;
9684                   cmp_code = GE;
9685                 }
9686               else
9687                 return 0;
9688
9689               if (GET_CODE (comparison) == LE)
9690                 add_adjust -= add_val;
9691
9692               /* If the initial value is not zero, or if the comparison
9693                  value is not an exact multiple of the increment, then we
9694                  can not reverse this loop.  */
9695               if (initial_value == const0_rtx
9696                   && GET_CODE (comparison_value) == CONST_INT)
9697                 {
9698                   if (((unsigned HOST_WIDE_INT) comparison_val % add_val) != 0)
9699                     return 0;
9700                 }
9701               else
9702                 {
9703                   if (! no_use_except_counting || add_val != 1)
9704                     return 0;
9705                 }
9706
9707               final_value = comparison_value;
9708
9709               /* Reset these in case we normalized the initial value
9710                  and comparison value above.  */
9711               if (GET_CODE (comparison_value) == CONST_INT
9712                   && GET_CODE (initial_value) == CONST_INT)
9713                 {
9714                   comparison_value = GEN_INT (comparison_val);
9715                   final_value
9716                     = GEN_INT (comparison_val + INTVAL (bl->initial_value));
9717                 }
9718               bl->initial_value = initial_value;
9719
9720               /* Save some info needed to produce the new insns.  */
9721               reg = bl->biv->dest_reg;
9722               mode = GET_MODE (reg);
9723               jump_label = condjump_label (PREV_INSN (loop_end));
9724               new_add_val = GEN_INT (-INTVAL (bl->biv->add_val));
9725
9726               /* Set start_value; if this is not a CONST_INT, we need
9727                  to generate a SUB.
9728                  Initialize biv to start_value before loop start.
9729                  The old initializing insn will be deleted as a
9730                  dead store by flow.c.  */
9731               if (initial_value == const0_rtx
9732                   && GET_CODE (comparison_value) == CONST_INT)
9733                 {
9734                   start_value
9735                     = gen_int_mode (comparison_val - add_adjust, mode);
9736                   loop_insn_hoist (loop, gen_move_insn (reg, start_value));
9737                 }
9738               else if (GET_CODE (initial_value) == CONST_INT)
9739                 {
9740                   rtx offset = GEN_INT (-INTVAL (initial_value) - add_adjust);
9741                   rtx add_insn = gen_add3_insn (reg, comparison_value, offset);
9742
9743                   if (add_insn == 0)
9744                     return 0;
9745
9746                   start_value
9747                     = gen_rtx_PLUS (mode, comparison_value, offset);
9748                   loop_insn_hoist (loop, add_insn);
9749                   if (GET_CODE (comparison) == LE)
9750                     final_value = gen_rtx_PLUS (mode, comparison_value,
9751                                                 GEN_INT (add_val));
9752                 }
9753               else if (! add_adjust)
9754                 {
9755                   rtx sub_insn = gen_sub3_insn (reg, comparison_value,
9756                                                 initial_value);
9757
9758                   if (sub_insn == 0)
9759                     return 0;
9760                   start_value
9761                     = gen_rtx_MINUS (mode, comparison_value, initial_value);
9762                   loop_insn_hoist (loop, sub_insn);
9763                 }
9764               else
9765                 /* We could handle the other cases too, but it'll be
9766                    better to have a testcase first.  */
9767                 return 0;
9768
9769               /* We may not have a single insn which can increment a reg, so
9770                  create a sequence to hold all the insns from expand_inc.  */
9771               start_sequence ();
9772               expand_inc (reg, new_add_val);
9773               tem = get_insns ();
9774               end_sequence ();
9775
9776               p = loop_insn_emit_before (loop, 0, bl->biv->insn, tem);
9777               delete_insn (bl->biv->insn);
9778
9779               /* Update biv info to reflect its new status.  */
9780               bl->biv->insn = p;
9781               bl->initial_value = start_value;
9782               bl->biv->add_val = new_add_val;
9783
9784               /* Update loop info.  */
9785               loop_info->initial_value = reg;
9786               loop_info->initial_equiv_value = reg;
9787               loop_info->final_value = const0_rtx;
9788               loop_info->final_equiv_value = const0_rtx;
9789               loop_info->comparison_value = const0_rtx;
9790               loop_info->comparison_code = cmp_code;
9791               loop_info->increment = new_add_val;
9792
9793               /* Inc LABEL_NUSES so that delete_insn will
9794                  not delete the label.  */
9795               LABEL_NUSES (XEXP (jump_label, 0))++;
9796
9797               /* If we have a separate comparison insn that does more
9798                  than just set cc0, the result of the comparison might
9799                  be used outside the loop.  */
9800               keep_first_compare = (compare_and_branch == 2
9801 #ifdef HAVE_CC0
9802                                     && sets_cc0_p (first_compare) <= 0
9803 #endif
9804                                     );
9805
9806               /* Emit an insn after the end of the loop to set the biv's
9807                  proper exit value if it is used anywhere outside the loop.  */
9808               if (keep_first_compare
9809                   || (REGNO_LAST_UID (bl->regno) != INSN_UID (first_compare))
9810                   || ! bl->init_insn
9811                   || REGNO_FIRST_UID (bl->regno) != INSN_UID (bl->init_insn))
9812                 loop_insn_sink (loop, gen_load_of_final_value (reg, final_value));
9813
9814               if (keep_first_compare)
9815                 loop_insn_sink (loop, PATTERN (first_compare));
9816
9817               /* Delete compare/branch at end of loop.  */
9818               delete_related_insns (PREV_INSN (loop_end));
9819               if (compare_and_branch == 2)
9820                 delete_related_insns (first_compare);
9821
9822               /* Add new compare/branch insn at end of loop.  */
9823               start_sequence ();
9824               emit_cmp_and_jump_insns (reg, const0_rtx, cmp_code, NULL_RTX,
9825                                        mode, 0,
9826                                        XEXP (jump_label, 0));
9827               tem = get_insns ();
9828               end_sequence ();
9829               emit_jump_insn_before (tem, loop_end);
9830
9831               for (tem = PREV_INSN (loop_end);
9832                    tem && !JUMP_P (tem);
9833                    tem = PREV_INSN (tem))
9834                 ;
9835
9836               if (tem)
9837                 JUMP_LABEL (tem) = XEXP (jump_label, 0);
9838
9839               if (nonneg)
9840                 {
9841                   if (tem)
9842                     {
9843                       /* Increment of LABEL_NUSES done above.  */
9844                       /* Register is now always nonnegative,
9845                          so add REG_NONNEG note to the branch.  */
9846                       REG_NOTES (tem) = gen_rtx_EXPR_LIST (REG_NONNEG, reg,
9847                                                            REG_NOTES (tem));
9848                     }
9849                   bl->nonneg = 1;
9850                 }
9851
9852               /* No insn may reference both the reversed and another biv or it
9853                  will fail (see comment near the top of the loop reversal
9854                  code).
9855                  Earlier on, we have verified that the biv has no use except
9856                  counting, or it is the only biv in this function.
9857                  However, the code that computes no_use_except_counting does
9858                  not verify reg notes.  It's possible to have an insn that
9859                  references another biv, and has a REG_EQUAL note with an
9860                  expression based on the reversed biv.  To avoid this case,
9861                  remove all REG_EQUAL notes based on the reversed biv
9862                  here.  */
9863               for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
9864                 if (INSN_P (p))
9865                   {
9866                     rtx *pnote;
9867                     rtx set = single_set (p);
9868                     /* If this is a set of a GIV based on the reversed biv, any
9869                        REG_EQUAL notes should still be correct.  */
9870                     if (! set
9871                         || !REG_P (SET_DEST (set))
9872                         || (size_t) REGNO (SET_DEST (set)) >= ivs->n_regs
9873                         || REG_IV_TYPE (ivs, REGNO (SET_DEST (set))) != GENERAL_INDUCT
9874                         || REG_IV_INFO (ivs, REGNO (SET_DEST (set)))->src_reg != bl->biv->src_reg)
9875                       for (pnote = &REG_NOTES (p); *pnote;)
9876                         {
9877                           if (REG_NOTE_KIND (*pnote) == REG_EQUAL
9878                               && reg_mentioned_p (regno_reg_rtx[bl->regno],
9879                                                   XEXP (*pnote, 0)))
9880                             *pnote = XEXP (*pnote, 1);
9881                           else
9882                             pnote = &XEXP (*pnote, 1);
9883                         }
9884                   }
9885
9886               /* Mark that this biv has been reversed.  Each giv which depends
9887                  on this biv, and which is also live past the end of the loop
9888                  will have to be fixed up.  */
9889
9890               bl->reversed = 1;
9891
9892               if (loop_dump_stream)
9893                 {
9894                   fprintf (loop_dump_stream, "Reversed loop");
9895                   if (bl->nonneg)
9896                     fprintf (loop_dump_stream, " and added reg_nonneg\n");
9897                   else
9898                     fprintf (loop_dump_stream, "\n");
9899                 }
9900
9901               return 1;
9902             }
9903         }
9904     }
9905
9906   return 0;
9907 }
9908 \f
9909 /* Verify whether the biv BL appears to be eliminable,
9910    based on the insns in the loop that refer to it.
9911
9912    If ELIMINATE_P is nonzero, actually do the elimination.
9913
9914    THRESHOLD and INSN_COUNT are from loop_optimize and are used to
9915    determine whether invariant insns should be placed inside or at the
9916    start of the loop.  */
9917
9918 static int
9919 maybe_eliminate_biv (const struct loop *loop, struct iv_class *bl,
9920                      int eliminate_p, int threshold, int insn_count)
9921 {
9922   struct loop_ivs *ivs = LOOP_IVS (loop);
9923   rtx reg = bl->biv->dest_reg;
9924   rtx p;
9925
9926   /* Scan all insns in the loop, stopping if we find one that uses the
9927      biv in a way that we cannot eliminate.  */
9928
9929   for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
9930     {
9931       enum rtx_code code = GET_CODE (p);
9932       basic_block where_bb = 0;
9933       rtx where_insn = threshold >= insn_count ? 0 : p;
9934       rtx note;
9935
9936       /* If this is a libcall that sets a giv, skip ahead to its end.  */
9937       if (INSN_P (p))
9938         {
9939           note = find_reg_note (p, REG_LIBCALL, NULL_RTX);
9940
9941           if (note)
9942             {
9943               rtx last = XEXP (note, 0);
9944               rtx set = single_set (last);
9945
9946               if (set && REG_P (SET_DEST (set)))
9947                 {
9948                   unsigned int regno = REGNO (SET_DEST (set));
9949
9950                   if (regno < ivs->n_regs
9951                       && REG_IV_TYPE (ivs, regno) == GENERAL_INDUCT
9952                       && REG_IV_INFO (ivs, regno)->src_reg == bl->biv->src_reg)
9953                     p = last;
9954                 }
9955             }
9956         }
9957
9958       /* Closely examine the insn if the biv is mentioned.  */
9959       if ((code == INSN || code == JUMP_INSN || code == CALL_INSN)
9960           && reg_mentioned_p (reg, PATTERN (p))
9961           && ! maybe_eliminate_biv_1 (loop, PATTERN (p), p, bl,
9962                                       eliminate_p, where_bb, where_insn))
9963         {
9964           if (loop_dump_stream)
9965             fprintf (loop_dump_stream,
9966                      "Cannot eliminate biv %d: biv used in insn %d.\n",
9967                      bl->regno, INSN_UID (p));
9968           break;
9969         }
9970
9971       /* If we are eliminating, kill REG_EQUAL notes mentioning the biv.  */
9972       if (eliminate_p
9973           && (note = find_reg_note (p, REG_EQUAL, NULL_RTX)) != NULL_RTX
9974           && reg_mentioned_p (reg, XEXP (note, 0)))
9975         remove_note (p, note);
9976     }
9977
9978   if (p == loop->end)
9979     {
9980       if (loop_dump_stream)
9981         fprintf (loop_dump_stream, "biv %d %s eliminated.\n",
9982                  bl->regno, eliminate_p ? "was" : "can be");
9983       return 1;
9984     }
9985
9986   return 0;
9987 }
9988 \f
9989 /* INSN and REFERENCE are instructions in the same insn chain.
9990    Return nonzero if INSN is first.  */
9991
9992 static int
9993 loop_insn_first_p (rtx insn, rtx reference)
9994 {
9995   rtx p, q;
9996
9997   for (p = insn, q = reference;;)
9998     {
9999       /* Start with test for not first so that INSN == REFERENCE yields not
10000          first.  */
10001       if (q == insn || ! p)
10002         return 0;
10003       if (p == reference || ! q)
10004         return 1;
10005
10006       /* Either of P or Q might be a NOTE.  Notes have the same LUID as the
10007          previous insn, hence the <= comparison below does not work if
10008          P is a note.  */
10009       if (INSN_UID (p) < max_uid_for_loop
10010           && INSN_UID (q) < max_uid_for_loop
10011           && !NOTE_P (p))
10012         return INSN_LUID (p) <= INSN_LUID (q);
10013
10014       if (INSN_UID (p) >= max_uid_for_loop
10015           || NOTE_P (p))
10016         p = NEXT_INSN (p);
10017       if (INSN_UID (q) >= max_uid_for_loop)
10018         q = NEXT_INSN (q);
10019     }
10020 }
10021
10022 /* We are trying to eliminate BIV in INSN using GIV.  Return nonzero if
10023    the offset that we have to take into account due to auto-increment /
10024    div derivation is zero.  */
10025 static int
10026 biv_elimination_giv_has_0_offset (struct induction *biv,
10027                                   struct induction *giv, rtx insn)
10028 {
10029   /* If the giv V had the auto-inc address optimization applied
10030      to it, and INSN occurs between the giv insn and the biv
10031      insn, then we'd have to adjust the value used here.
10032      This is rare, so we don't bother to make this possible.  */
10033   if (giv->auto_inc_opt
10034       && ((loop_insn_first_p (giv->insn, insn)
10035            && loop_insn_first_p (insn, biv->insn))
10036           || (loop_insn_first_p (biv->insn, insn)
10037               && loop_insn_first_p (insn, giv->insn))))
10038     return 0;
10039
10040   return 1;
10041 }
10042
10043 /* If BL appears in X (part of the pattern of INSN), see if we can
10044    eliminate its use.  If so, return 1.  If not, return 0.
10045
10046    If BIV does not appear in X, return 1.
10047
10048    If ELIMINATE_P is nonzero, actually do the elimination.
10049    WHERE_INSN/WHERE_BB indicate where extra insns should be added.
10050    Depending on how many items have been moved out of the loop, it
10051    will either be before INSN (when WHERE_INSN is nonzero) or at the
10052    start of the loop (when WHERE_INSN is zero).  */
10053
10054 static int
10055 maybe_eliminate_biv_1 (const struct loop *loop, rtx x, rtx insn,
10056                        struct iv_class *bl, int eliminate_p,
10057                        basic_block where_bb, rtx where_insn)
10058 {
10059   enum rtx_code code = GET_CODE (x);
10060   rtx reg = bl->biv->dest_reg;
10061   enum machine_mode mode = GET_MODE (reg);
10062   struct induction *v;
10063   rtx arg, tem;
10064 #ifdef HAVE_cc0
10065   rtx new;
10066 #endif
10067   int arg_operand;
10068   const char *fmt;
10069   int i, j;
10070
10071   switch (code)
10072     {
10073     case REG:
10074       /* If we haven't already been able to do something with this BIV,
10075          we can't eliminate it.  */
10076       if (x == reg)
10077         return 0;
10078       return 1;
10079
10080     case SET:
10081       /* If this sets the BIV, it is not a problem.  */
10082       if (SET_DEST (x) == reg)
10083         return 1;
10084
10085       /* If this is an insn that defines a giv, it is also ok because
10086          it will go away when the giv is reduced.  */
10087       for (v = bl->giv; v; v = v->next_iv)
10088         if (v->giv_type == DEST_REG && SET_DEST (x) == v->dest_reg)
10089           return 1;
10090
10091 #ifdef HAVE_cc0
10092       if (SET_DEST (x) == cc0_rtx && SET_SRC (x) == reg)
10093         {
10094           /* Can replace with any giv that was reduced and
10095              that has (MULT_VAL != 0) and (ADD_VAL == 0).
10096              Require a constant for MULT_VAL, so we know it's nonzero.
10097              ??? We disable this optimization to avoid potential
10098              overflows.  */
10099
10100           for (v = bl->giv; v; v = v->next_iv)
10101             if (GET_CODE (v->mult_val) == CONST_INT && v->mult_val != const0_rtx
10102                 && v->add_val == const0_rtx
10103                 && ! v->ignore && ! v->maybe_dead && v->always_computable
10104                 && v->mode == mode
10105                 && 0)
10106               {
10107                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10108                   continue;
10109
10110                 if (! eliminate_p)
10111                   return 1;
10112
10113                 /* If the giv has the opposite direction of change,
10114                    then reverse the comparison.  */
10115                 if (INTVAL (v->mult_val) < 0)
10116                   new = gen_rtx_COMPARE (GET_MODE (v->new_reg),
10117                                          const0_rtx, v->new_reg);
10118                 else
10119                   new = v->new_reg;
10120
10121                 /* We can probably test that giv's reduced reg.  */
10122                 if (validate_change (insn, &SET_SRC (x), new, 0))
10123                   return 1;
10124               }
10125
10126           /* Look for a giv with (MULT_VAL != 0) and (ADD_VAL != 0);
10127              replace test insn with a compare insn (cmp REDUCED_GIV ADD_VAL).
10128              Require a constant for MULT_VAL, so we know it's nonzero.
10129              ??? Do this only if ADD_VAL is a pointer to avoid a potential
10130              overflow problem.  */
10131
10132           for (v = bl->giv; v; v = v->next_iv)
10133             if (GET_CODE (v->mult_val) == CONST_INT
10134                 && v->mult_val != const0_rtx
10135                 && ! v->ignore && ! v->maybe_dead && v->always_computable
10136                 && v->mode == mode
10137                 && (GET_CODE (v->add_val) == SYMBOL_REF
10138                     || GET_CODE (v->add_val) == LABEL_REF
10139                     || GET_CODE (v->add_val) == CONST
10140                     || (REG_P (v->add_val)
10141                         && REG_POINTER (v->add_val))))
10142               {
10143                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10144                   continue;
10145
10146                 if (! eliminate_p)
10147                   return 1;
10148
10149                 /* If the giv has the opposite direction of change,
10150                    then reverse the comparison.  */
10151                 if (INTVAL (v->mult_val) < 0)
10152                   new = gen_rtx_COMPARE (VOIDmode, copy_rtx (v->add_val),
10153                                          v->new_reg);
10154                 else
10155                   new = gen_rtx_COMPARE (VOIDmode, v->new_reg,
10156                                          copy_rtx (v->add_val));
10157
10158                 /* Replace biv with the giv's reduced register.  */
10159                 update_reg_last_use (v->add_val, insn);
10160                 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
10161                   return 1;
10162
10163                 /* Insn doesn't support that constant or invariant.  Copy it
10164                    into a register (it will be a loop invariant.)  */
10165                 tem = gen_reg_rtx (GET_MODE (v->new_reg));
10166
10167                 loop_insn_emit_before (loop, 0, where_insn,
10168                                        gen_move_insn (tem,
10169                                                       copy_rtx (v->add_val)));
10170
10171                 /* Substitute the new register for its invariant value in
10172                    the compare expression.  */
10173                 XEXP (new, (INTVAL (v->mult_val) < 0) ? 0 : 1) = tem;
10174                 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
10175                   return 1;
10176               }
10177         }
10178 #endif
10179       break;
10180
10181     case COMPARE:
10182     case EQ:  case NE:
10183     case GT:  case GE:  case GTU:  case GEU:
10184     case LT:  case LE:  case LTU:  case LEU:
10185       /* See if either argument is the biv.  */
10186       if (XEXP (x, 0) == reg)
10187         arg = XEXP (x, 1), arg_operand = 1;
10188       else if (XEXP (x, 1) == reg)
10189         arg = XEXP (x, 0), arg_operand = 0;
10190       else
10191         break;
10192
10193       if (CONSTANT_P (arg))
10194         {
10195           /* First try to replace with any giv that has constant positive
10196              mult_val and constant add_val.  We might be able to support
10197              negative mult_val, but it seems complex to do it in general.  */
10198
10199           for (v = bl->giv; v; v = v->next_iv)
10200             if (GET_CODE (v->mult_val) == CONST_INT
10201                 && INTVAL (v->mult_val) > 0
10202                 && (GET_CODE (v->add_val) == SYMBOL_REF
10203                     || GET_CODE (v->add_val) == LABEL_REF
10204                     || GET_CODE (v->add_val) == CONST
10205                     || (REG_P (v->add_val)
10206                         && REG_POINTER (v->add_val)))
10207                 && ! v->ignore && ! v->maybe_dead && v->always_computable
10208                 && v->mode == mode)
10209               {
10210                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10211                   continue;
10212
10213                 /* Don't eliminate if the linear combination that makes up
10214                    the giv overflows when it is applied to ARG.  */
10215                 if (GET_CODE (arg) == CONST_INT)
10216                   {
10217                     rtx add_val;
10218
10219                     if (GET_CODE (v->add_val) == CONST_INT)
10220                       add_val = v->add_val;
10221                     else
10222                       add_val = const0_rtx;
10223
10224                     if (const_mult_add_overflow_p (arg, v->mult_val,
10225                                                    add_val, mode, 1))
10226                       continue;
10227                   }
10228
10229                 if (! eliminate_p)
10230                   return 1;
10231
10232                 /* Replace biv with the giv's reduced reg.  */
10233                 validate_change (insn, &XEXP (x, 1 - arg_operand), v->new_reg, 1);
10234
10235                 /* If all constants are actually constant integers and
10236                    the derived constant can be directly placed in the COMPARE,
10237                    do so.  */
10238                 if (GET_CODE (arg) == CONST_INT
10239                     && GET_CODE (v->add_val) == CONST_INT)
10240                   {
10241                     tem = expand_mult_add (arg, NULL_RTX, v->mult_val,
10242                                            v->add_val, mode, 1);
10243                   }
10244                 else
10245                   {
10246                     /* Otherwise, load it into a register.  */
10247                     tem = gen_reg_rtx (mode);
10248                     loop_iv_add_mult_emit_before (loop, arg,
10249                                                   v->mult_val, v->add_val,
10250                                                   tem, where_bb, where_insn);
10251                   }
10252
10253                 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
10254
10255                 if (apply_change_group ())
10256                   return 1;
10257               }
10258
10259           /* Look for giv with positive constant mult_val and nonconst add_val.
10260              Insert insns to calculate new compare value.
10261              ??? Turn this off due to possible overflow.  */
10262
10263           for (v = bl->giv; v; v = v->next_iv)
10264             if (GET_CODE (v->mult_val) == CONST_INT
10265                 && INTVAL (v->mult_val) > 0
10266                 && ! v->ignore && ! v->maybe_dead && v->always_computable
10267                 && v->mode == mode
10268                 && 0)
10269               {
10270                 rtx tem;
10271
10272                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10273                   continue;
10274
10275                 if (! eliminate_p)
10276                   return 1;
10277
10278                 tem = gen_reg_rtx (mode);
10279
10280                 /* Replace biv with giv's reduced register.  */
10281                 validate_change (insn, &XEXP (x, 1 - arg_operand),
10282                                  v->new_reg, 1);
10283
10284                 /* Compute value to compare against.  */
10285                 loop_iv_add_mult_emit_before (loop, arg,
10286                                               v->mult_val, v->add_val,
10287                                               tem, where_bb, where_insn);
10288                 /* Use it in this insn.  */
10289                 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
10290                 if (apply_change_group ())
10291                   return 1;
10292               }
10293         }
10294       else if (REG_P (arg) || MEM_P (arg))
10295         {
10296           if (loop_invariant_p (loop, arg) == 1)
10297             {
10298               /* Look for giv with constant positive mult_val and nonconst
10299                  add_val. Insert insns to compute new compare value.
10300                  ??? Turn this off due to possible overflow.  */
10301
10302               for (v = bl->giv; v; v = v->next_iv)
10303                 if (GET_CODE (v->mult_val) == CONST_INT && INTVAL (v->mult_val) > 0
10304                     && ! v->ignore && ! v->maybe_dead && v->always_computable
10305                     && v->mode == mode
10306                     && 0)
10307                   {
10308                     rtx tem;
10309
10310                     if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10311                       continue;
10312
10313                     if (! eliminate_p)
10314                       return 1;
10315
10316                     tem = gen_reg_rtx (mode);
10317
10318                     /* Replace biv with giv's reduced register.  */
10319                     validate_change (insn, &XEXP (x, 1 - arg_operand),
10320                                      v->new_reg, 1);
10321
10322                     /* Compute value to compare against.  */
10323                     loop_iv_add_mult_emit_before (loop, arg,
10324                                                   v->mult_val, v->add_val,
10325                                                   tem, where_bb, where_insn);
10326                     validate_change (insn, &XEXP (x, arg_operand), tem, 1);
10327                     if (apply_change_group ())
10328                       return 1;
10329                   }
10330             }
10331
10332           /* This code has problems.  Basically, you can't know when
10333              seeing if we will eliminate BL, whether a particular giv
10334              of ARG will be reduced.  If it isn't going to be reduced,
10335              we can't eliminate BL.  We can try forcing it to be reduced,
10336              but that can generate poor code.
10337
10338              The problem is that the benefit of reducing TV, below should
10339              be increased if BL can actually be eliminated, but this means
10340              we might have to do a topological sort of the order in which
10341              we try to process biv.  It doesn't seem worthwhile to do
10342              this sort of thing now.  */
10343
10344 #if 0
10345           /* Otherwise the reg compared with had better be a biv.  */
10346           if (!REG_P (arg)
10347               || REG_IV_TYPE (ivs, REGNO (arg)) != BASIC_INDUCT)
10348             return 0;
10349
10350           /* Look for a pair of givs, one for each biv,
10351              with identical coefficients.  */
10352           for (v = bl->giv; v; v = v->next_iv)
10353             {
10354               struct induction *tv;
10355
10356               if (v->ignore || v->maybe_dead || v->mode != mode)
10357                 continue;
10358
10359               for (tv = REG_IV_CLASS (ivs, REGNO (arg))->giv; tv;
10360                    tv = tv->next_iv)
10361                 if (! tv->ignore && ! tv->maybe_dead
10362                     && rtx_equal_p (tv->mult_val, v->mult_val)
10363                     && rtx_equal_p (tv->add_val, v->add_val)
10364                     && tv->mode == mode)
10365                   {
10366                     if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
10367                       continue;
10368
10369                     if (! eliminate_p)
10370                       return 1;
10371
10372                     /* Replace biv with its giv's reduced reg.  */
10373                     XEXP (x, 1 - arg_operand) = v->new_reg;
10374                     /* Replace other operand with the other giv's
10375                        reduced reg.  */
10376                     XEXP (x, arg_operand) = tv->new_reg;
10377                     return 1;
10378                   }
10379             }
10380 #endif
10381         }
10382
10383       /* If we get here, the biv can't be eliminated.  */
10384       return 0;
10385
10386     case MEM:
10387       /* If this address is a DEST_ADDR giv, it doesn't matter if the
10388          biv is used in it, since it will be replaced.  */
10389       for (v = bl->giv; v; v = v->next_iv)
10390         if (v->giv_type == DEST_ADDR && v->location == &XEXP (x, 0))
10391           return 1;
10392       break;
10393
10394     default:
10395       break;
10396     }
10397
10398   /* See if any subexpression fails elimination.  */
10399   fmt = GET_RTX_FORMAT (code);
10400   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
10401     {
10402       switch (fmt[i])
10403         {
10404         case 'e':
10405           if (! maybe_eliminate_biv_1 (loop, XEXP (x, i), insn, bl,
10406                                        eliminate_p, where_bb, where_insn))
10407             return 0;
10408           break;
10409
10410         case 'E':
10411           for (j = XVECLEN (x, i) - 1; j >= 0; j--)
10412             if (! maybe_eliminate_biv_1 (loop, XVECEXP (x, i, j), insn, bl,
10413                                          eliminate_p, where_bb, where_insn))
10414               return 0;
10415           break;
10416         }
10417     }
10418
10419   return 1;
10420 }
10421 \f
10422 /* Return nonzero if the last use of REG
10423    is in an insn following INSN in the same basic block.  */
10424
10425 static int
10426 last_use_this_basic_block (rtx reg, rtx insn)
10427 {
10428   rtx n;
10429   for (n = insn;
10430        n && !LABEL_P (n) && !JUMP_P (n);
10431        n = NEXT_INSN (n))
10432     {
10433       if (REGNO_LAST_UID (REGNO (reg)) == INSN_UID (n))
10434         return 1;
10435     }
10436   return 0;
10437 }
10438 \f
10439 /* Called via `note_stores' to record the initial value of a biv.  Here we
10440    just record the location of the set and process it later.  */
10441
10442 static void
10443 record_initial (rtx dest, rtx set, void *data ATTRIBUTE_UNUSED)
10444 {
10445   struct loop_ivs *ivs = (struct loop_ivs *) data;
10446   struct iv_class *bl;
10447
10448   if (!REG_P (dest)
10449       || REGNO (dest) >= ivs->n_regs
10450       || REG_IV_TYPE (ivs, REGNO (dest)) != BASIC_INDUCT)
10451     return;
10452
10453   bl = REG_IV_CLASS (ivs, REGNO (dest));
10454
10455   /* If this is the first set found, record it.  */
10456   if (bl->init_insn == 0)
10457     {
10458       bl->init_insn = note_insn;
10459       bl->init_set = set;
10460     }
10461 }
10462 \f
10463 /* If any of the registers in X are "old" and currently have a last use earlier
10464    than INSN, update them to have a last use of INSN.  Their actual last use
10465    will be the previous insn but it will not have a valid uid_luid so we can't
10466    use it.  X must be a source expression only.  */
10467
10468 static void
10469 update_reg_last_use (rtx x, rtx insn)
10470 {
10471   /* Check for the case where INSN does not have a valid luid.  In this case,
10472      there is no need to modify the regno_last_uid, as this can only happen
10473      when code is inserted after the loop_end to set a pseudo's final value,
10474      and hence this insn will never be the last use of x.
10475      ???? This comment is not correct.  See for example loop_givs_reduce.
10476      This may insert an insn before another new insn.  */
10477   if (REG_P (x) && REGNO (x) < max_reg_before_loop
10478       && INSN_UID (insn) < max_uid_for_loop
10479       && REGNO_LAST_LUID (REGNO (x)) < INSN_LUID (insn))
10480     {
10481       REGNO_LAST_UID (REGNO (x)) = INSN_UID (insn);
10482     }
10483   else
10484     {
10485       int i, j;
10486       const char *fmt = GET_RTX_FORMAT (GET_CODE (x));
10487       for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--)
10488         {
10489           if (fmt[i] == 'e')
10490             update_reg_last_use (XEXP (x, i), insn);
10491           else if (fmt[i] == 'E')
10492             for (j = XVECLEN (x, i) - 1; j >= 0; j--)
10493               update_reg_last_use (XVECEXP (x, i, j), insn);
10494         }
10495     }
10496 }
10497 \f
10498 /* Similar to rtlanal.c:get_condition, except that we also put an
10499    invariant last unless both operands are invariants.  */
10500
10501 static rtx
10502 get_condition_for_loop (const struct loop *loop, rtx x)
10503 {
10504   rtx comparison = get_condition (x, (rtx*) 0, false, true);
10505
10506   if (comparison == 0
10507       || ! loop_invariant_p (loop, XEXP (comparison, 0))
10508       || loop_invariant_p (loop, XEXP (comparison, 1)))
10509     return comparison;
10510
10511   return gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)), VOIDmode,
10512                          XEXP (comparison, 1), XEXP (comparison, 0));
10513 }
10514
10515 /* Scan the function and determine whether it has indirect (computed) jumps.
10516
10517    This is taken mostly from flow.c; similar code exists elsewhere
10518    in the compiler.  It may be useful to put this into rtlanal.c.  */
10519 static int
10520 indirect_jump_in_function_p (rtx start)
10521 {
10522   rtx insn;
10523
10524   for (insn = start; insn; insn = NEXT_INSN (insn))
10525     if (computed_jump_p (insn))
10526       return 1;
10527
10528   return 0;
10529 }
10530
10531 /* Add MEM to the LOOP_MEMS array, if appropriate.  See the
10532    documentation for LOOP_MEMS for the definition of `appropriate'.
10533    This function is called from prescan_loop via for_each_rtx.  */
10534
10535 static int
10536 insert_loop_mem (rtx *mem, void *data ATTRIBUTE_UNUSED)
10537 {
10538   struct loop_info *loop_info = data;
10539   int i;
10540   rtx m = *mem;
10541
10542   if (m == NULL_RTX)
10543     return 0;
10544
10545   switch (GET_CODE (m))
10546     {
10547     case MEM:
10548       break;
10549
10550     case CLOBBER:
10551       /* We're not interested in MEMs that are only clobbered.  */
10552       return -1;
10553
10554     case CONST_DOUBLE:
10555       /* We're not interested in the MEM associated with a
10556          CONST_DOUBLE, so there's no need to traverse into this.  */
10557       return -1;
10558
10559     case EXPR_LIST:
10560       /* We're not interested in any MEMs that only appear in notes.  */
10561       return -1;
10562
10563     default:
10564       /* This is not a MEM.  */
10565       return 0;
10566     }
10567
10568   /* See if we've already seen this MEM.  */
10569   for (i = 0; i < loop_info->mems_idx; ++i)
10570     if (rtx_equal_p (m, loop_info->mems[i].mem))
10571       {
10572         if (MEM_VOLATILE_P (m) && !MEM_VOLATILE_P (loop_info->mems[i].mem))
10573           loop_info->mems[i].mem = m;
10574         if (GET_MODE (m) != GET_MODE (loop_info->mems[i].mem))
10575           /* The modes of the two memory accesses are different.  If
10576              this happens, something tricky is going on, and we just
10577              don't optimize accesses to this MEM.  */
10578           loop_info->mems[i].optimize = 0;
10579
10580         return 0;
10581       }
10582
10583   /* Resize the array, if necessary.  */
10584   if (loop_info->mems_idx == loop_info->mems_allocated)
10585     {
10586       if (loop_info->mems_allocated != 0)
10587         loop_info->mems_allocated *= 2;
10588       else
10589         loop_info->mems_allocated = 32;
10590
10591       loop_info->mems = xrealloc (loop_info->mems,
10592                                   loop_info->mems_allocated * sizeof (loop_mem_info));
10593     }
10594
10595   /* Actually insert the MEM.  */
10596   loop_info->mems[loop_info->mems_idx].mem = m;
10597   /* We can't hoist this MEM out of the loop if it's a BLKmode MEM
10598      because we can't put it in a register.  We still store it in the
10599      table, though, so that if we see the same address later, but in a
10600      non-BLK mode, we'll not think we can optimize it at that point.  */
10601   loop_info->mems[loop_info->mems_idx].optimize = (GET_MODE (m) != BLKmode);
10602   loop_info->mems[loop_info->mems_idx].reg = NULL_RTX;
10603   ++loop_info->mems_idx;
10604
10605   return 0;
10606 }
10607
10608
10609 /* Allocate REGS->ARRAY or reallocate it if it is too small.
10610
10611    Increment REGS->ARRAY[I].SET_IN_LOOP at the index I of each
10612    register that is modified by an insn between FROM and TO.  If the
10613    value of an element of REGS->array[I].SET_IN_LOOP becomes 127 or
10614    more, stop incrementing it, to avoid overflow.
10615
10616    Store in REGS->ARRAY[I].SINGLE_USAGE the single insn in which
10617    register I is used, if it is only used once.  Otherwise, it is set
10618    to 0 (for no uses) or const0_rtx for more than one use.  This
10619    parameter may be zero, in which case this processing is not done.
10620
10621    Set REGS->ARRAY[I].MAY_NOT_OPTIMIZE nonzero if we should not
10622    optimize register I.  */
10623
10624 static void
10625 loop_regs_scan (const struct loop *loop, int extra_size)
10626 {
10627   struct loop_regs *regs = LOOP_REGS (loop);
10628   int old_nregs;
10629   /* last_set[n] is nonzero iff reg n has been set in the current
10630    basic block.  In that case, it is the insn that last set reg n.  */
10631   rtx *last_set;
10632   rtx insn;
10633   int i;
10634
10635   old_nregs = regs->num;
10636   regs->num = max_reg_num ();
10637
10638   /* Grow the regs array if not allocated or too small.  */
10639   if (regs->num >= regs->size)
10640     {
10641       regs->size = regs->num + extra_size;
10642
10643       regs->array = xrealloc (regs->array, regs->size * sizeof (*regs->array));
10644
10645       /* Zero the new elements.  */
10646       memset (regs->array + old_nregs, 0,
10647               (regs->size - old_nregs) * sizeof (*regs->array));
10648     }
10649
10650   /* Clear previously scanned fields but do not clear n_times_set.  */
10651   for (i = 0; i < old_nregs; i++)
10652     {
10653       regs->array[i].set_in_loop = 0;
10654       regs->array[i].may_not_optimize = 0;
10655       regs->array[i].single_usage = NULL_RTX;
10656     }
10657
10658   last_set = xcalloc (regs->num, sizeof (rtx));
10659
10660   /* Scan the loop, recording register usage.  */
10661   for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
10662        insn = NEXT_INSN (insn))
10663     {
10664       if (INSN_P (insn))
10665         {
10666           /* Record registers that have exactly one use.  */
10667           find_single_use_in_loop (regs, insn, PATTERN (insn));
10668
10669           /* Include uses in REG_EQUAL notes.  */
10670           if (REG_NOTES (insn))
10671             find_single_use_in_loop (regs, insn, REG_NOTES (insn));
10672
10673           if (GET_CODE (PATTERN (insn)) == SET
10674               || GET_CODE (PATTERN (insn)) == CLOBBER)
10675             count_one_set (regs, insn, PATTERN (insn), last_set);
10676           else if (GET_CODE (PATTERN (insn)) == PARALLEL)
10677             {
10678               int i;
10679               for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
10680                 count_one_set (regs, insn, XVECEXP (PATTERN (insn), 0, i),
10681                                last_set);
10682             }
10683         }
10684
10685       if (LABEL_P (insn) || JUMP_P (insn))
10686         memset (last_set, 0, regs->num * sizeof (rtx));
10687
10688       /* Invalidate all registers used for function argument passing.
10689          We check rtx_varies_p for the same reason as below, to allow
10690          optimizing PIC calculations.  */
10691       if (CALL_P (insn))
10692         {
10693           rtx link;
10694           for (link = CALL_INSN_FUNCTION_USAGE (insn);
10695                link;
10696                link = XEXP (link, 1))
10697             {
10698               rtx op, reg;
10699
10700               if (GET_CODE (op = XEXP (link, 0)) == USE
10701                   && REG_P (reg = XEXP (op, 0))
10702                   && rtx_varies_p (reg, 1))
10703                 regs->array[REGNO (reg)].may_not_optimize = 1;
10704             }
10705         }
10706     }
10707
10708   /* Invalidate all hard registers clobbered by calls.  With one exception:
10709      a call-clobbered PIC register is still function-invariant for our
10710      purposes, since we can hoist any PIC calculations out of the loop.
10711      Thus the call to rtx_varies_p.  */
10712   if (LOOP_INFO (loop)->has_call)
10713     for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
10714       if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i)
10715           && rtx_varies_p (regno_reg_rtx[i], 1))
10716         {
10717           regs->array[i].may_not_optimize = 1;
10718           regs->array[i].set_in_loop = 1;
10719         }
10720
10721 #ifdef AVOID_CCMODE_COPIES
10722   /* Don't try to move insns which set CC registers if we should not
10723      create CCmode register copies.  */
10724   for (i = regs->num - 1; i >= FIRST_PSEUDO_REGISTER; i--)
10725     if (GET_MODE_CLASS (GET_MODE (regno_reg_rtx[i])) == MODE_CC)
10726       regs->array[i].may_not_optimize = 1;
10727 #endif
10728
10729   /* Set regs->array[I].n_times_set for the new registers.  */
10730   for (i = old_nregs; i < regs->num; i++)
10731     regs->array[i].n_times_set = regs->array[i].set_in_loop;
10732
10733   free (last_set);
10734 }
10735
10736 /* Returns the number of real INSNs in the LOOP.  */
10737
10738 static int
10739 count_insns_in_loop (const struct loop *loop)
10740 {
10741   int count = 0;
10742   rtx insn;
10743
10744   for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
10745        insn = NEXT_INSN (insn))
10746     if (INSN_P (insn))
10747       ++count;
10748
10749   return count;
10750 }
10751
10752 /* Move MEMs into registers for the duration of the loop.  */
10753
10754 static void
10755 load_mems (const struct loop *loop)
10756 {
10757   struct loop_info *loop_info = LOOP_INFO (loop);
10758   struct loop_regs *regs = LOOP_REGS (loop);
10759   int maybe_never = 0;
10760   int i;
10761   rtx p, prev_ebb_head;
10762   rtx label = NULL_RTX;
10763   rtx end_label;
10764   /* Nonzero if the next instruction may never be executed.  */
10765   int next_maybe_never = 0;
10766   unsigned int last_max_reg = max_reg_num ();
10767
10768   if (loop_info->mems_idx == 0)
10769     return;
10770
10771   /* We cannot use next_label here because it skips over normal insns.  */
10772   end_label = next_nonnote_insn (loop->end);
10773   if (end_label && !LABEL_P (end_label))
10774     end_label = NULL_RTX;
10775
10776   /* Check to see if it's possible that some instructions in the loop are
10777      never executed.  Also check if there is a goto out of the loop other
10778      than right after the end of the loop.  */
10779   for (p = next_insn_in_loop (loop, loop->scan_start);
10780        p != NULL_RTX;
10781        p = next_insn_in_loop (loop, p))
10782     {
10783       if (LABEL_P (p))
10784         maybe_never = 1;
10785       else if (JUMP_P (p)
10786                /* If we enter the loop in the middle, and scan
10787                   around to the beginning, don't set maybe_never
10788                   for that.  This must be an unconditional jump,
10789                   otherwise the code at the top of the loop might
10790                   never be executed.  Unconditional jumps are
10791                   followed a by barrier then loop end.  */
10792                && ! (JUMP_P (p)
10793                      && JUMP_LABEL (p) == loop->top
10794                      && NEXT_INSN (NEXT_INSN (p)) == loop->end
10795                      && any_uncondjump_p (p)))
10796         {
10797           /* If this is a jump outside of the loop but not right
10798              after the end of the loop, we would have to emit new fixup
10799              sequences for each such label.  */
10800           if (/* If we can't tell where control might go when this
10801                  JUMP_INSN is executed, we must be conservative.  */
10802               !JUMP_LABEL (p)
10803               || (JUMP_LABEL (p) != end_label
10804                   && (INSN_UID (JUMP_LABEL (p)) >= max_uid_for_loop
10805                       || INSN_LUID (JUMP_LABEL (p)) < INSN_LUID (loop->start)
10806                       || INSN_LUID (JUMP_LABEL (p)) > INSN_LUID (loop->end))))
10807             return;
10808
10809           if (!any_condjump_p (p))
10810             /* Something complicated.  */
10811             maybe_never = 1;
10812           else
10813             /* If there are any more instructions in the loop, they
10814                might not be reached.  */
10815             next_maybe_never = 1;
10816         }
10817       else if (next_maybe_never)
10818         maybe_never = 1;
10819     }
10820
10821   /* Find start of the extended basic block that enters the loop.  */
10822   for (p = loop->start;
10823        PREV_INSN (p) && !LABEL_P (p);
10824        p = PREV_INSN (p))
10825     ;
10826   prev_ebb_head = p;
10827
10828   cselib_init (true);
10829
10830   /* Build table of mems that get set to constant values before the
10831      loop.  */
10832   for (; p != loop->start; p = NEXT_INSN (p))
10833     cselib_process_insn (p);
10834
10835   /* Actually move the MEMs.  */
10836   for (i = 0; i < loop_info->mems_idx; ++i)
10837     {
10838       regset_head load_copies;
10839       regset_head store_copies;
10840       int written = 0;
10841       rtx reg;
10842       rtx mem = loop_info->mems[i].mem;
10843       rtx mem_list_entry;
10844
10845       if (MEM_VOLATILE_P (mem)
10846           || loop_invariant_p (loop, XEXP (mem, 0)) != 1)
10847         /* There's no telling whether or not MEM is modified.  */
10848         loop_info->mems[i].optimize = 0;
10849
10850       /* Go through the MEMs written to in the loop to see if this
10851          one is aliased by one of them.  */
10852       mem_list_entry = loop_info->store_mems;
10853       while (mem_list_entry)
10854         {
10855           if (rtx_equal_p (mem, XEXP (mem_list_entry, 0)))
10856             written = 1;
10857           else if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
10858                                     mem, rtx_varies_p))
10859             {
10860               /* MEM is indeed aliased by this store.  */
10861               loop_info->mems[i].optimize = 0;
10862               break;
10863             }
10864           mem_list_entry = XEXP (mem_list_entry, 1);
10865         }
10866
10867       if (flag_float_store && written
10868           && GET_MODE_CLASS (GET_MODE (mem)) == MODE_FLOAT)
10869         loop_info->mems[i].optimize = 0;
10870
10871       /* If this MEM is written to, we must be sure that there
10872          are no reads from another MEM that aliases this one.  */
10873       if (loop_info->mems[i].optimize && written)
10874         {
10875           int j;
10876
10877           for (j = 0; j < loop_info->mems_idx; ++j)
10878             {
10879               if (j == i)
10880                 continue;
10881               else if (true_dependence (mem,
10882                                         VOIDmode,
10883                                         loop_info->mems[j].mem,
10884                                         rtx_varies_p))
10885                 {
10886                   /* It's not safe to hoist loop_info->mems[i] out of
10887                      the loop because writes to it might not be
10888                      seen by reads from loop_info->mems[j].  */
10889                   loop_info->mems[i].optimize = 0;
10890                   break;
10891                 }
10892             }
10893         }
10894
10895       if (maybe_never && may_trap_p (mem))
10896         /* We can't access the MEM outside the loop; it might
10897            cause a trap that wouldn't have happened otherwise.  */
10898         loop_info->mems[i].optimize = 0;
10899
10900       if (!loop_info->mems[i].optimize)
10901         /* We thought we were going to lift this MEM out of the
10902            loop, but later discovered that we could not.  */
10903         continue;
10904
10905       INIT_REG_SET (&load_copies);
10906       INIT_REG_SET (&store_copies);
10907
10908       /* Allocate a pseudo for this MEM.  We set REG_USERVAR_P in
10909          order to keep scan_loop from moving stores to this MEM
10910          out of the loop just because this REG is neither a
10911          user-variable nor used in the loop test.  */
10912       reg = gen_reg_rtx (GET_MODE (mem));
10913       REG_USERVAR_P (reg) = 1;
10914       loop_info->mems[i].reg = reg;
10915
10916       /* Now, replace all references to the MEM with the
10917          corresponding pseudos.  */
10918       maybe_never = 0;
10919       for (p = next_insn_in_loop (loop, loop->scan_start);
10920            p != NULL_RTX;
10921            p = next_insn_in_loop (loop, p))
10922         {
10923           if (INSN_P (p))
10924             {
10925               rtx set;
10926
10927               set = single_set (p);
10928
10929               /* See if this copies the mem into a register that isn't
10930                  modified afterwards.  We'll try to do copy propagation
10931                  a little further on.  */
10932               if (set
10933                   /* @@@ This test is _way_ too conservative.  */
10934                   && ! maybe_never
10935                   && REG_P (SET_DEST (set))
10936                   && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER
10937                   && REGNO (SET_DEST (set)) < last_max_reg
10938                   && regs->array[REGNO (SET_DEST (set))].n_times_set == 1
10939                   && rtx_equal_p (SET_SRC (set), mem))
10940                 SET_REGNO_REG_SET (&load_copies, REGNO (SET_DEST (set)));
10941
10942               /* See if this copies the mem from a register that isn't
10943                  modified afterwards.  We'll try to remove the
10944                  redundant copy later on by doing a little register
10945                  renaming and copy propagation.   This will help
10946                  to untangle things for the BIV detection code.  */
10947               if (set
10948                   && ! maybe_never
10949                   && REG_P (SET_SRC (set))
10950                   && REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER
10951                   && REGNO (SET_SRC (set)) < last_max_reg
10952                   && regs->array[REGNO (SET_SRC (set))].n_times_set == 1
10953                   && rtx_equal_p (SET_DEST (set), mem))
10954                 SET_REGNO_REG_SET (&store_copies, REGNO (SET_SRC (set)));
10955
10956               /* If this is a call which uses / clobbers this memory
10957                  location, we must not change the interface here.  */
10958               if (CALL_P (p)
10959                   && reg_mentioned_p (loop_info->mems[i].mem,
10960                                       CALL_INSN_FUNCTION_USAGE (p)))
10961                 {
10962                   cancel_changes (0);
10963                   loop_info->mems[i].optimize = 0;
10964                   break;
10965                 }
10966               else
10967                 /* Replace the memory reference with the shadow register.  */
10968                 replace_loop_mems (p, loop_info->mems[i].mem,
10969                                    loop_info->mems[i].reg, written);
10970             }
10971
10972           if (LABEL_P (p)
10973               || JUMP_P (p))
10974             maybe_never = 1;
10975         }
10976
10977       if (! loop_info->mems[i].optimize)
10978         ; /* We found we couldn't do the replacement, so do nothing.  */
10979       else if (! apply_change_group ())
10980         /* We couldn't replace all occurrences of the MEM.  */
10981         loop_info->mems[i].optimize = 0;
10982       else
10983         {
10984           /* Load the memory immediately before LOOP->START, which is
10985              the NOTE_LOOP_BEG.  */
10986           cselib_val *e = cselib_lookup (mem, VOIDmode, 0);
10987           rtx set;
10988           rtx best = mem;
10989           unsigned j;
10990           struct elt_loc_list *const_equiv = 0;
10991           reg_set_iterator rsi;
10992
10993           if (e)
10994             {
10995               struct elt_loc_list *equiv;
10996               struct elt_loc_list *best_equiv = 0;
10997               for (equiv = e->locs; equiv; equiv = equiv->next)
10998                 {
10999                   if (CONSTANT_P (equiv->loc))
11000                     const_equiv = equiv;
11001                   else if (REG_P (equiv->loc)
11002                            /* Extending hard register lifetimes causes crash
11003                               on SRC targets.  Doing so on non-SRC is
11004                               probably also not good idea, since we most
11005                               probably have pseudoregister equivalence as
11006                               well.  */
11007                            && REGNO (equiv->loc) >= FIRST_PSEUDO_REGISTER)
11008                     best_equiv = equiv;
11009                 }
11010               /* Use the constant equivalence if that is cheap enough.  */
11011               if (! best_equiv)
11012                 best_equiv = const_equiv;
11013               else if (const_equiv
11014                        && (rtx_cost (const_equiv->loc, SET)
11015                            <= rtx_cost (best_equiv->loc, SET)))
11016                 {
11017                   best_equiv = const_equiv;
11018                   const_equiv = 0;
11019                 }
11020
11021               /* If best_equiv is nonzero, we know that MEM is set to a
11022                  constant or register before the loop.  We will use this
11023                  knowledge to initialize the shadow register with that
11024                  constant or reg rather than by loading from MEM.  */
11025               if (best_equiv)
11026                 best = copy_rtx (best_equiv->loc);
11027             }
11028
11029           set = gen_move_insn (reg, best);
11030           set = loop_insn_hoist (loop, set);
11031           if (REG_P (best))
11032             {
11033               for (p = prev_ebb_head; p != loop->start; p = NEXT_INSN (p))
11034                 if (REGNO_LAST_UID (REGNO (best)) == INSN_UID (p))
11035                   {
11036                     REGNO_LAST_UID (REGNO (best)) = INSN_UID (set);
11037                     break;
11038                   }
11039             }
11040
11041           if (const_equiv)
11042             set_unique_reg_note (set, REG_EQUAL, copy_rtx (const_equiv->loc));
11043
11044           if (written)
11045             {
11046               if (label == NULL_RTX)
11047                 {
11048                   label = gen_label_rtx ();
11049                   emit_label_after (label, loop->end);
11050                 }
11051
11052               /* Store the memory immediately after END, which is
11053                  the NOTE_LOOP_END.  */
11054               set = gen_move_insn (copy_rtx (mem), reg);
11055               loop_insn_emit_after (loop, 0, label, set);
11056             }
11057
11058           if (loop_dump_stream)
11059             {
11060               fprintf (loop_dump_stream, "Hoisted regno %d %s from ",
11061                        REGNO (reg), (written ? "r/w" : "r/o"));
11062               print_rtl (loop_dump_stream, mem);
11063               fputc ('\n', loop_dump_stream);
11064             }
11065
11066           /* Attempt a bit of copy propagation.  This helps untangle the
11067              data flow, and enables {basic,general}_induction_var to find
11068              more bivs/givs.  */
11069           EXECUTE_IF_SET_IN_REG_SET
11070             (&load_copies, FIRST_PSEUDO_REGISTER, j, rsi)
11071             {
11072               try_copy_prop (loop, reg, j);
11073             }
11074           CLEAR_REG_SET (&load_copies);
11075
11076           EXECUTE_IF_SET_IN_REG_SET
11077             (&store_copies, FIRST_PSEUDO_REGISTER, j, rsi)
11078             {
11079               try_swap_copy_prop (loop, reg, j);
11080             }
11081           CLEAR_REG_SET (&store_copies);
11082         }
11083     }
11084
11085   /* Now, we need to replace all references to the previous exit
11086      label with the new one.  */
11087   if (label != NULL_RTX && end_label != NULL_RTX)
11088     for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
11089       if (JUMP_P (p) && JUMP_LABEL (p) == end_label)
11090         redirect_jump (p, label, false);
11091
11092   cselib_finish ();
11093 }
11094
11095 /* For communication between note_reg_stored and its caller.  */
11096 struct note_reg_stored_arg
11097 {
11098   int set_seen;
11099   rtx reg;
11100 };
11101
11102 /* Called via note_stores, record in SET_SEEN whether X, which is written,
11103    is equal to ARG.  */
11104 static void
11105 note_reg_stored (rtx x, rtx setter ATTRIBUTE_UNUSED, void *arg)
11106 {
11107   struct note_reg_stored_arg *t = (struct note_reg_stored_arg *) arg;
11108   if (t->reg == x)
11109     t->set_seen = 1;
11110 }
11111
11112 /* Try to replace every occurrence of pseudo REGNO with REPLACEMENT.
11113    There must be exactly one insn that sets this pseudo; it will be
11114    deleted if all replacements succeed and we can prove that the register
11115    is not used after the loop.  */
11116
11117 static void
11118 try_copy_prop (const struct loop *loop, rtx replacement, unsigned int regno)
11119 {
11120   /* This is the reg that we are copying from.  */
11121   rtx reg_rtx = regno_reg_rtx[regno];
11122   rtx init_insn = 0;
11123   rtx insn;
11124   /* These help keep track of whether we replaced all uses of the reg.  */
11125   int replaced_last = 0;
11126   int store_is_first = 0;
11127
11128   for (insn = next_insn_in_loop (loop, loop->scan_start);
11129        insn != NULL_RTX;
11130        insn = next_insn_in_loop (loop, insn))
11131     {
11132       rtx set;
11133
11134       /* Only substitute within one extended basic block from the initializing
11135          insn.  */
11136       if (LABEL_P (insn) && init_insn)
11137         break;
11138
11139       if (! INSN_P (insn))
11140         continue;
11141
11142       /* Is this the initializing insn?  */
11143       set = single_set (insn);
11144       if (set
11145           && REG_P (SET_DEST (set))
11146           && REGNO (SET_DEST (set)) == regno)
11147         {
11148           gcc_assert (!init_insn);
11149
11150           init_insn = insn;
11151           if (REGNO_FIRST_UID (regno) == INSN_UID (insn))
11152             store_is_first = 1;
11153         }
11154
11155       /* Only substitute after seeing the initializing insn.  */
11156       if (init_insn && insn != init_insn)
11157         {
11158           struct note_reg_stored_arg arg;
11159
11160           replace_loop_regs (insn, reg_rtx, replacement);
11161           if (REGNO_LAST_UID (regno) == INSN_UID (insn))
11162             replaced_last = 1;
11163
11164           /* Stop replacing when REPLACEMENT is modified.  */
11165           arg.reg = replacement;
11166           arg.set_seen = 0;
11167           note_stores (PATTERN (insn), note_reg_stored, &arg);
11168           if (arg.set_seen)
11169             {
11170               rtx note = find_reg_note (insn, REG_EQUAL, NULL);
11171
11172               /* It is possible that we've turned previously valid REG_EQUAL to
11173                  invalid, as we change the REGNO to REPLACEMENT and unlike REGNO,
11174                  REPLACEMENT is modified, we get different meaning.  */
11175               if (note && reg_mentioned_p (replacement, XEXP (note, 0)))
11176                 remove_note (insn, note);
11177               break;
11178             }
11179         }
11180     }
11181   gcc_assert (init_insn);
11182   if (apply_change_group ())
11183     {
11184       if (loop_dump_stream)
11185         fprintf (loop_dump_stream, "  Replaced reg %d", regno);
11186       if (store_is_first && replaced_last)
11187         {
11188           rtx first;
11189           rtx retval_note;
11190
11191           /* Assume we're just deleting INIT_INSN.  */
11192           first = init_insn;
11193           /* Look for REG_RETVAL note.  If we're deleting the end of
11194              the libcall sequence, the whole sequence can go.  */
11195           retval_note = find_reg_note (init_insn, REG_RETVAL, NULL_RTX);
11196           /* If we found a REG_RETVAL note, find the first instruction
11197              in the sequence.  */
11198           if (retval_note)
11199             first = XEXP (retval_note, 0);
11200
11201           /* Delete the instructions.  */
11202           loop_delete_insns (first, init_insn);
11203         }
11204       if (loop_dump_stream)
11205         fprintf (loop_dump_stream, ".\n");
11206     }
11207 }
11208
11209 /* Replace all the instructions from FIRST up to and including LAST
11210    with NOTE_INSN_DELETED notes.  */
11211
11212 static void
11213 loop_delete_insns (rtx first, rtx last)
11214 {
11215   while (1)
11216     {
11217       if (loop_dump_stream)
11218         fprintf (loop_dump_stream, ", deleting init_insn (%d)",
11219                  INSN_UID (first));
11220       delete_insn (first);
11221
11222       /* If this was the LAST instructions we're supposed to delete,
11223          we're done.  */
11224       if (first == last)
11225         break;
11226
11227       first = NEXT_INSN (first);
11228     }
11229 }
11230
11231 /* Try to replace occurrences of pseudo REGNO with REPLACEMENT within
11232    loop LOOP if the order of the sets of these registers can be
11233    swapped.  There must be exactly one insn within the loop that sets
11234    this pseudo followed immediately by a move insn that sets
11235    REPLACEMENT with REGNO.  */
11236 static void
11237 try_swap_copy_prop (const struct loop *loop, rtx replacement,
11238                     unsigned int regno)
11239 {
11240   rtx insn;
11241   rtx set = NULL_RTX;
11242   unsigned int new_regno;
11243
11244   new_regno = REGNO (replacement);
11245
11246   for (insn = next_insn_in_loop (loop, loop->scan_start);
11247        insn != NULL_RTX;
11248        insn = next_insn_in_loop (loop, insn))
11249     {
11250       /* Search for the insn that copies REGNO to NEW_REGNO?  */
11251       if (INSN_P (insn)
11252           && (set = single_set (insn))
11253           && REG_P (SET_DEST (set))
11254           && REGNO (SET_DEST (set)) == new_regno
11255           && REG_P (SET_SRC (set))
11256           && REGNO (SET_SRC (set)) == regno)
11257         break;
11258     }
11259
11260   if (insn != NULL_RTX)
11261     {
11262       rtx prev_insn;
11263       rtx prev_set;
11264
11265       /* Some DEF-USE info would come in handy here to make this
11266          function more general.  For now, just check the previous insn
11267          which is the most likely candidate for setting REGNO.  */
11268
11269       prev_insn = PREV_INSN (insn);
11270
11271       if (INSN_P (insn)
11272           && (prev_set = single_set (prev_insn))
11273           && REG_P (SET_DEST (prev_set))
11274           && REGNO (SET_DEST (prev_set)) == regno)
11275         {
11276           /* We have:
11277              (set (reg regno) (expr))
11278              (set (reg new_regno) (reg regno))
11279
11280              so try converting this to:
11281              (set (reg new_regno) (expr))
11282              (set (reg regno) (reg new_regno))
11283
11284              The former construct is often generated when a global
11285              variable used for an induction variable is shadowed by a
11286              register (NEW_REGNO).  The latter construct improves the
11287              chances of GIV replacement and BIV elimination.  */
11288
11289           validate_change (prev_insn, &SET_DEST (prev_set),
11290                            replacement, 1);
11291           validate_change (insn, &SET_DEST (set),
11292                            SET_SRC (set), 1);
11293           validate_change (insn, &SET_SRC (set),
11294                            replacement, 1);
11295
11296           if (apply_change_group ())
11297             {
11298               if (loop_dump_stream)
11299                 fprintf (loop_dump_stream,
11300                          "  Swapped set of reg %d at %d with reg %d at %d.\n",
11301                          regno, INSN_UID (insn),
11302                          new_regno, INSN_UID (prev_insn));
11303
11304               /* Update first use of REGNO.  */
11305               if (REGNO_FIRST_UID (regno) == INSN_UID (prev_insn))
11306                 REGNO_FIRST_UID (regno) = INSN_UID (insn);
11307
11308               /* Now perform copy propagation to hopefully
11309                  remove all uses of REGNO within the loop.  */
11310               try_copy_prop (loop, replacement, regno);
11311             }
11312         }
11313     }
11314 }
11315
11316 /* Worker function for find_mem_in_note, called via for_each_rtx.  */
11317
11318 static int
11319 find_mem_in_note_1 (rtx *x, void *data)
11320 {
11321   if (*x != NULL_RTX && MEM_P (*x))
11322     {
11323       rtx *res = (rtx *) data;
11324       *res = *x;
11325       return 1;
11326     }
11327   return 0;
11328 }
11329
11330 /* Returns the first MEM found in NOTE by depth-first search.  */
11331
11332 static rtx
11333 find_mem_in_note (rtx note)
11334 {
11335   if (note && for_each_rtx (&note, find_mem_in_note_1, &note))
11336     return note;
11337   return NULL_RTX;
11338 }
11339
11340 /* Replace MEM with its associated pseudo register.  This function is
11341    called from load_mems via for_each_rtx.  DATA is actually a pointer
11342    to a structure describing the instruction currently being scanned
11343    and the MEM we are currently replacing.  */
11344
11345 static int
11346 replace_loop_mem (rtx *mem, void *data)
11347 {
11348   loop_replace_args *args = (loop_replace_args *) data;
11349   rtx m = *mem;
11350
11351   if (m == NULL_RTX)
11352     return 0;
11353
11354   switch (GET_CODE (m))
11355     {
11356     case MEM:
11357       break;
11358
11359     case CONST_DOUBLE:
11360       /* We're not interested in the MEM associated with a
11361          CONST_DOUBLE, so there's no need to traverse into one.  */
11362       return -1;
11363
11364     default:
11365       /* This is not a MEM.  */
11366       return 0;
11367     }
11368
11369   if (!rtx_equal_p (args->match, m))
11370     /* This is not the MEM we are currently replacing.  */
11371     return 0;
11372
11373   /* Actually replace the MEM.  */
11374   validate_change (args->insn, mem, args->replacement, 1);
11375
11376   return 0;
11377 }
11378
11379 static void
11380 replace_loop_mems (rtx insn, rtx mem, rtx reg, int written)
11381 {
11382   loop_replace_args args;
11383
11384   args.insn = insn;
11385   args.match = mem;
11386   args.replacement = reg;
11387
11388   for_each_rtx (&insn, replace_loop_mem, &args);
11389
11390   /* If we hoist a mem write out of the loop, then REG_EQUAL
11391      notes referring to the mem are no longer valid.  */
11392   if (written)
11393     {
11394       rtx note, sub;
11395       rtx *link;
11396
11397       for (link = &REG_NOTES (insn); (note = *link); link = &XEXP (note, 1))
11398         {
11399           if (REG_NOTE_KIND (note) == REG_EQUAL
11400               && (sub = find_mem_in_note (note))
11401               && true_dependence (mem, VOIDmode, sub, rtx_varies_p))
11402             {
11403               /* Remove the note.  */
11404               validate_change (NULL_RTX, link, XEXP (note, 1), 1);
11405               break;
11406             }
11407         }
11408     }
11409 }
11410
11411 /* Replace one register with another.  Called through for_each_rtx; PX points
11412    to the rtx being scanned.  DATA is actually a pointer to
11413    a structure of arguments.  */
11414
11415 static int
11416 replace_loop_reg (rtx *px, void *data)
11417 {
11418   rtx x = *px;
11419   loop_replace_args *args = (loop_replace_args *) data;
11420
11421   if (x == NULL_RTX)
11422     return 0;
11423
11424   if (x == args->match)
11425     validate_change (args->insn, px, args->replacement, 1);
11426
11427   return 0;
11428 }
11429
11430 static void
11431 replace_loop_regs (rtx insn, rtx reg, rtx replacement)
11432 {
11433   loop_replace_args args;
11434
11435   args.insn = insn;
11436   args.match = reg;
11437   args.replacement = replacement;
11438
11439   for_each_rtx (&insn, replace_loop_reg, &args);
11440 }
11441 \f
11442 /* Emit insn for PATTERN after WHERE_INSN in basic block WHERE_BB
11443    (ignored in the interim).  */
11444
11445 static rtx
11446 loop_insn_emit_after (const struct loop *loop ATTRIBUTE_UNUSED,
11447                       basic_block where_bb ATTRIBUTE_UNUSED, rtx where_insn,
11448                       rtx pattern)
11449 {
11450   return emit_insn_after (pattern, where_insn);
11451 }
11452
11453
11454 /* If WHERE_INSN is nonzero emit insn for PATTERN before WHERE_INSN
11455    in basic block WHERE_BB (ignored in the interim) within the loop
11456    otherwise hoist PATTERN into the loop pre-header.  */
11457
11458 static rtx
11459 loop_insn_emit_before (const struct loop *loop,
11460                        basic_block where_bb ATTRIBUTE_UNUSED,
11461                        rtx where_insn, rtx pattern)
11462 {
11463   if (! where_insn)
11464     return loop_insn_hoist (loop, pattern);
11465   return emit_insn_before (pattern, where_insn);
11466 }
11467
11468
11469 /* Emit call insn for PATTERN before WHERE_INSN in basic block
11470    WHERE_BB (ignored in the interim) within the loop.  */
11471
11472 static rtx
11473 loop_call_insn_emit_before (const struct loop *loop ATTRIBUTE_UNUSED,
11474                             basic_block where_bb ATTRIBUTE_UNUSED,
11475                             rtx where_insn, rtx pattern)
11476 {
11477   return emit_call_insn_before (pattern, where_insn);
11478 }
11479
11480
11481 /* Hoist insn for PATTERN into the loop pre-header.  */
11482
11483 static rtx
11484 loop_insn_hoist (const struct loop *loop, rtx pattern)
11485 {
11486   return loop_insn_emit_before (loop, 0, loop->start, pattern);
11487 }
11488
11489
11490 /* Hoist call insn for PATTERN into the loop pre-header.  */
11491
11492 static rtx
11493 loop_call_insn_hoist (const struct loop *loop, rtx pattern)
11494 {
11495   return loop_call_insn_emit_before (loop, 0, loop->start, pattern);
11496 }
11497
11498
11499 /* Sink insn for PATTERN after the loop end.  */
11500
11501 static rtx
11502 loop_insn_sink (const struct loop *loop, rtx pattern)
11503 {
11504   return loop_insn_emit_before (loop, 0, loop->sink, pattern);
11505 }
11506
11507 /* bl->final_value can be either general_operand or PLUS of general_operand
11508    and constant.  Emit sequence of instructions to load it into REG.  */
11509 static rtx
11510 gen_load_of_final_value (rtx reg, rtx final_value)
11511 {
11512   rtx seq;
11513   start_sequence ();
11514   final_value = force_operand (final_value, reg);
11515   if (final_value != reg)
11516     emit_move_insn (reg, final_value);
11517   seq = get_insns ();
11518   end_sequence ();
11519   return seq;
11520 }
11521
11522 /* If the loop has multiple exits, emit insn for PATTERN before the
11523    loop to ensure that it will always be executed no matter how the
11524    loop exits.  Otherwise, emit the insn for PATTERN after the loop,
11525    since this is slightly more efficient.  */
11526
11527 static rtx
11528 loop_insn_sink_or_swim (const struct loop *loop, rtx pattern)
11529 {
11530   if (loop->exit_count)
11531     return loop_insn_hoist (loop, pattern);
11532   else
11533     return loop_insn_sink (loop, pattern);
11534 }
11535 \f
11536 static void
11537 loop_ivs_dump (const struct loop *loop, FILE *file, int verbose)
11538 {
11539   struct iv_class *bl;
11540   int iv_num = 0;
11541
11542   if (! loop || ! file)
11543     return;
11544
11545   for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
11546     iv_num++;
11547
11548   fprintf (file, "Loop %d: %d IV classes\n", loop->num, iv_num);
11549
11550   for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
11551     {
11552       loop_iv_class_dump (bl, file, verbose);
11553       fputc ('\n', file);
11554     }
11555 }
11556
11557
11558 static void
11559 loop_iv_class_dump (const struct iv_class *bl, FILE *file,
11560                     int verbose ATTRIBUTE_UNUSED)
11561 {
11562   struct induction *v;
11563   rtx incr;
11564   int i;
11565
11566   if (! bl || ! file)
11567     return;
11568
11569   fprintf (file, "IV class for reg %d, benefit %d\n",
11570            bl->regno, bl->total_benefit);
11571
11572   fprintf (file, " Init insn %d", INSN_UID (bl->init_insn));
11573   if (bl->initial_value)
11574     {
11575       fprintf (file, ", init val: ");
11576       print_simple_rtl (file, bl->initial_value);
11577     }
11578   if (bl->initial_test)
11579     {
11580       fprintf (file, ", init test: ");
11581       print_simple_rtl (file, bl->initial_test);
11582     }
11583   fputc ('\n', file);
11584
11585   if (bl->final_value)
11586     {
11587       fprintf (file, " Final val: ");
11588       print_simple_rtl (file, bl->final_value);
11589       fputc ('\n', file);
11590     }
11591
11592   if ((incr = biv_total_increment (bl)))
11593     {
11594       fprintf (file, " Total increment: ");
11595       print_simple_rtl (file, incr);
11596       fputc ('\n', file);
11597     }
11598
11599   /* List the increments.  */
11600   for (i = 0, v = bl->biv; v; v = v->next_iv, i++)
11601     {
11602       fprintf (file, " Inc%d: insn %d, incr: ", i, INSN_UID (v->insn));
11603       print_simple_rtl (file, v->add_val);
11604       fputc ('\n', file);
11605     }
11606
11607   /* List the givs.  */
11608   for (i = 0, v = bl->giv; v; v = v->next_iv, i++)
11609     {
11610       fprintf (file, " Giv%d: insn %d, benefit %d, ",
11611                i, INSN_UID (v->insn), v->benefit);
11612       if (v->giv_type == DEST_ADDR)
11613         print_simple_rtl (file, v->mem);
11614       else
11615         print_simple_rtl (file, single_set (v->insn));
11616       fputc ('\n', file);
11617     }
11618 }
11619
11620
11621 static void
11622 loop_biv_dump (const struct induction *v, FILE *file, int verbose)
11623 {
11624   if (! v || ! file)
11625     return;
11626
11627   fprintf (file,
11628            "Biv %d: insn %d",
11629            REGNO (v->dest_reg), INSN_UID (v->insn));
11630   fprintf (file, " const ");
11631   print_simple_rtl (file, v->add_val);
11632
11633   if (verbose && v->final_value)
11634     {
11635       fputc ('\n', file);
11636       fprintf (file, " final ");
11637       print_simple_rtl (file, v->final_value);
11638     }
11639
11640   fputc ('\n', file);
11641 }
11642
11643
11644 static void
11645 loop_giv_dump (const struct induction *v, FILE *file, int verbose)
11646 {
11647   if (! v || ! file)
11648     return;
11649
11650   if (v->giv_type == DEST_REG)
11651     fprintf (file, "Giv %d: insn %d",
11652              REGNO (v->dest_reg), INSN_UID (v->insn));
11653   else
11654     fprintf (file, "Dest address: insn %d",
11655              INSN_UID (v->insn));
11656
11657   fprintf (file, " src reg %d benefit %d",
11658            REGNO (v->src_reg), v->benefit);
11659   fprintf (file, " lifetime %d",
11660            v->lifetime);
11661
11662   if (v->replaceable)
11663     fprintf (file, " replaceable");
11664
11665   if (v->no_const_addval)
11666     fprintf (file, " ncav");
11667
11668   if (v->ext_dependent)
11669     {
11670       switch (GET_CODE (v->ext_dependent))
11671         {
11672         case SIGN_EXTEND:
11673           fprintf (file, " ext se");
11674           break;
11675         case ZERO_EXTEND:
11676           fprintf (file, " ext ze");
11677           break;
11678         case TRUNCATE:
11679           fprintf (file, " ext tr");
11680           break;
11681         default:
11682           gcc_unreachable ();
11683         }
11684     }
11685
11686   fputc ('\n', file);
11687   fprintf (file, " mult ");
11688   print_simple_rtl (file, v->mult_val);
11689
11690   fputc ('\n', file);
11691   fprintf (file, " add  ");
11692   print_simple_rtl (file, v->add_val);
11693
11694   if (verbose && v->final_value)
11695     {
11696       fputc ('\n', file);
11697       fprintf (file, " final ");
11698       print_simple_rtl (file, v->final_value);
11699     }
11700
11701   fputc ('\n', file);
11702 }
11703
11704
11705 void
11706 debug_ivs (const struct loop *loop)
11707 {
11708   loop_ivs_dump (loop, stderr, 1);
11709 }
11710
11711
11712 void
11713 debug_iv_class (const struct iv_class *bl)
11714 {
11715   loop_iv_class_dump (bl, stderr, 1);
11716 }
11717
11718
11719 void
11720 debug_biv (const struct induction *v)
11721 {
11722   loop_biv_dump (v, stderr, 1);
11723 }
11724
11725
11726 void
11727 debug_giv (const struct induction *v)
11728 {
11729   loop_giv_dump (v, stderr, 1);
11730 }
11731
11732
11733 #define LOOP_BLOCK_NUM_1(INSN) \
11734 ((INSN) ? (BLOCK_FOR_INSN (INSN) ? BLOCK_NUM (INSN) : - 1) : -1)
11735
11736 /* The notes do not have an assigned block, so look at the next insn.  */
11737 #define LOOP_BLOCK_NUM(INSN) \
11738 ((INSN) ? (NOTE_P (INSN) \
11739             ? LOOP_BLOCK_NUM_1 (next_nonnote_insn (INSN)) \
11740             : LOOP_BLOCK_NUM_1 (INSN)) \
11741         : -1)
11742
11743 #define LOOP_INSN_UID(INSN) ((INSN) ? INSN_UID (INSN) : -1)
11744
11745 static void
11746 loop_dump_aux (const struct loop *loop, FILE *file,
11747                int verbose ATTRIBUTE_UNUSED)
11748 {
11749   rtx label;
11750
11751   if (! loop || ! file || !BB_HEAD (loop->first))
11752     return;
11753
11754   /* Print diagnostics to compare our concept of a loop with
11755      what the loop notes say.  */
11756   if (! PREV_INSN (BB_HEAD (loop->first))
11757       || !NOTE_P (PREV_INSN (BB_HEAD (loop->first)))
11758       || NOTE_LINE_NUMBER (PREV_INSN (BB_HEAD (loop->first)))
11759       != NOTE_INSN_LOOP_BEG)
11760     fprintf (file, ";;  No NOTE_INSN_LOOP_BEG at %d\n",
11761              INSN_UID (PREV_INSN (BB_HEAD (loop->first))));
11762   if (! NEXT_INSN (BB_END (loop->last))
11763       || !NOTE_P (NEXT_INSN (BB_END (loop->last)))
11764       || NOTE_LINE_NUMBER (NEXT_INSN (BB_END (loop->last)))
11765       != NOTE_INSN_LOOP_END)
11766     fprintf (file, ";;  No NOTE_INSN_LOOP_END at %d\n",
11767              INSN_UID (NEXT_INSN (BB_END (loop->last))));
11768
11769   if (loop->start)
11770     {
11771       fprintf (file,
11772                ";;  start %d (%d), end %d (%d)\n",
11773                LOOP_BLOCK_NUM (loop->start),
11774                LOOP_INSN_UID (loop->start),
11775                LOOP_BLOCK_NUM (loop->end),
11776                LOOP_INSN_UID (loop->end));
11777       fprintf (file, ";;  top %d (%d), scan start %d (%d)\n",
11778                LOOP_BLOCK_NUM (loop->top),
11779                LOOP_INSN_UID (loop->top),
11780                LOOP_BLOCK_NUM (loop->scan_start),
11781                LOOP_INSN_UID (loop->scan_start));
11782       fprintf (file, ";;  exit_count %d", loop->exit_count);
11783       if (loop->exit_count)
11784         {
11785           fputs (", labels:", file);
11786           for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
11787             {
11788               fprintf (file, " %d ",
11789                        LOOP_INSN_UID (XEXP (label, 0)));
11790             }
11791         }
11792       fputs ("\n", file);
11793     }
11794 }
11795
11796 /* Call this function from the debugger to dump LOOP.  */
11797
11798 void
11799 debug_loop (const struct loop *loop)
11800 {
11801   flow_loop_dump (loop, stderr, loop_dump_aux, 1);
11802 }
11803
11804 /* Call this function from the debugger to dump LOOPS.  */
11805
11806 void
11807 debug_loops (const struct loops *loops)
11808 {
11809   flow_loops_dump (loops, stderr, loop_dump_aux, 1);
11810 }