return MAX_MACHINE_MODE;
default:
- abort ();
+ gcc_unreachable ();
}
if (opno == -1)
unsigned HOST_WIDE_INT bitpos = bitnum % unit;
rtx op0 = str_rtx;
int byte_offset;
+ rtx orig_value;
enum machine_mode op_mode = mode_for_extraction (EP_insv, 3);
/* We could handle this, but we should always be called with a pseudo
for our targets and all insns should take them as outputs. */
- if (! (*insn_data[icode].operand[0].predicate) (dest, mode0)
- || ! (*insn_data[icode].operand[1].predicate) (src, mode1)
- || ! (*insn_data[icode].operand[2].predicate) (rtxpos, mode2))
- abort ();
+ gcc_assert ((*insn_data[icode].operand[0].predicate) (dest, mode0)
+ && (*insn_data[icode].operand[1].predicate) (src, mode1)
+ && (*insn_data[icode].operand[2].predicate) (rtxpos, mode2));
pat = GEN_FCN (icode) (dest, src, rtxpos);
seq = get_insns ();
end_sequence ();
{
if (GET_CODE (op0) == SUBREG)
{
- if (GET_MODE (SUBREG_REG (op0)) == fieldmode
- || GET_MODE_CLASS (fieldmode) == MODE_INT
- || GET_MODE_CLASS (fieldmode) == MODE_PARTIAL_INT)
- op0 = SUBREG_REG (op0);
- else
- /* Else we've got some float mode source being extracted into
- a different float mode destination -- this combination of
- subregs results in Severe Tire Damage. */
- abort ();
+ /* Else we've got some float mode source being extracted
+ into a different float mode destination -- this
+ combination of subregs results in Severe Tire
+ Damage. */
+ gcc_assert (GET_MODE (SUBREG_REG (op0)) == fieldmode
+ || GET_MODE_CLASS (fieldmode) == MODE_INT
+ || GET_MODE_CLASS (fieldmode) == MODE_PARTIAL_INT);
+ op0 = SUBREG_REG (op0);
}
if (REG_P (op0))
op0 = gen_rtx_SUBREG (fieldmode, op0, byte_offset);
{
if (MEM_P (op0))
op0 = adjust_address (op0, imode, 0);
- else if (imode != BLKmode)
- op0 = gen_lowpart (imode, op0);
else
- abort ();
+ {
+ gcc_assert (imode != BLKmode);
+ op0 = gen_lowpart (imode, op0);
+ }
}
}
if (GET_CODE (op0) == SUBREG)
{
- if (GET_MODE (SUBREG_REG (op0)) == fieldmode
- || GET_MODE_CLASS (fieldmode) == MODE_INT
- || GET_MODE_CLASS (fieldmode) == MODE_PARTIAL_INT)
- op0 = SUBREG_REG (op0);
- else
- /* Else we've got some float mode source being extracted into
- a different float mode destination -- this combination of
- subregs results in Severe Tire Damage. */
- abort ();
+ /* Else we've got some float mode source being extracted into
+ a different float mode destination -- this combination of
+ subregs results in Severe Tire Damage. */
+ gcc_assert (GET_MODE (SUBREG_REG (op0)) == fieldmode
+ || GET_MODE_CLASS (fieldmode) == MODE_INT
+ || GET_MODE_CLASS (fieldmode) == MODE_PARTIAL_INT);
+ op0 = SUBREG_REG (op0);
}
emit_insn (GEN_FCN (icode)
pseudo. We can trivially remove a SUBREG that does not
change the size of the operand. Such a SUBREG may have been
added above. Otherwise, abort. */
- if (GET_CODE (op0) == SUBREG
- && (GET_MODE_SIZE (GET_MODE (op0))
- == GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
- op0 = SUBREG_REG (op0);
- else
- abort ();
+ gcc_assert (GET_CODE (op0) == SUBREG
+ && (GET_MODE_SIZE (GET_MODE (op0))
+ == GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))));
+ op0 = SUBREG_REG (op0);
}
op0 = gen_rtx_SUBREG (mode_for_size (BITS_PER_WORD, MODE_INT, 0),
op0, (offset * UNITS_PER_WORD));
corresponding size. This can occur on a machine with 64 bit registers
that uses SFmode for float. This can also occur for unaligned float
structure fields. */
+ orig_value = value;
if (GET_MODE_CLASS (GET_MODE (value)) != MODE_INT
&& GET_MODE_CLASS (GET_MODE (value)) != MODE_PARTIAL_INT)
value = gen_lowpart ((GET_MODE (value) == VOIDmode
/* Fetch that unit, store the bitfield in it, then store
the unit. */
tempreg = copy_to_reg (op0);
- store_bit_field (tempreg, bitsize, bitpos, fieldmode, value);
+ store_bit_field (tempreg, bitsize, bitpos, fieldmode, orig_value);
emit_move_insn (op0, tempreg);
return value;
}
}
else if (GET_CODE (value) == CONST_INT)
value1 = gen_int_mode (INTVAL (value), maxmode);
- else if (!CONSTANT_P (value))
+ else
/* Parse phase is supposed to make VALUE's data type
match that of the component reference, which is a type
at least as wide as the field; so VALUE should have
a mode that corresponds to that type. */
- abort ();
+ gcc_assert (CONSTANT_P (value));
}
/* If this machine's insv insists on a register,
if (REG_P (op0) || GET_CODE (op0) == SUBREG)
{
- if (offset != 0)
- abort ();
+ gcc_assert (!offset);
/* Special treatment for a bit field split across two registers. */
if (bitsize + bitpos > BITS_PER_WORD)
{
NULL_RTX, 1, OPTAB_LIB_WIDEN);
if (bitpos > 0)
value = expand_shift (LSHIFT_EXPR, mode, value,
- build_int_cst (NULL_TREE,
- bitpos, 0), NULL_RTX, 1);
+ build_int_cst (NULL_TREE, bitpos), NULL_RTX, 1);
}
/* Now clear the chosen bits in OP0,
/* We could handle this, but we should always be called with a pseudo
for our targets and all insns should take them as outputs. */
- if (! (*insn_data[icode].operand[0].predicate) (dest, mode0)
- || ! (*insn_data[icode].operand[1].predicate) (src, mode1)
- || ! (*insn_data[icode].operand[2].predicate) (rtxpos, mode2))
- abort ();
+ gcc_assert ((*insn_data[icode].operand[0].predicate) (dest, mode0)
+ && (*insn_data[icode].operand[1].predicate) (src, mode1)
+ && (*insn_data[icode].operand[2].predicate) (rtxpos, mode2));
pat = GEN_FCN (icode) (dest, src, rtxpos);
seq = get_insns ();
{
if (MEM_P (op0))
op0 = adjust_address (op0, imode, 0);
- else if (imode != BLKmode)
- op0 = gen_lowpart (imode, op0);
else
- abort ();
+ {
+ gcc_assert (imode != BLKmode);
+ op0 = gen_lowpart (imode, op0);
+ }
}
}
{
if (mode1 != GET_MODE (op0))
{
- if (GET_CODE (op0) == SUBREG)
+ if (MEM_P (op0))
+ op0 = adjust_address (op0, mode1, offset);
+ else
{
- if (GET_MODE (SUBREG_REG (op0)) == mode1
- || GET_MODE_CLASS (mode1) == MODE_INT
- || GET_MODE_CLASS (mode1) == MODE_PARTIAL_INT)
- op0 = SUBREG_REG (op0);
- else
- /* Else we've got some float mode source being extracted into
- a different float mode destination -- this combination of
- subregs results in Severe Tire Damage. */
+ rtx sub = simplify_gen_subreg (mode1, op0, GET_MODE (op0),
+ byte_offset);
+ if (sub == NULL)
goto no_subreg_mode_swap;
+ op0 = sub;
}
- if (REG_P (op0))
- op0 = gen_rtx_SUBREG (mode1, op0, byte_offset);
- else
- op0 = adjust_address (op0, mode1, offset);
}
if (mode1 != mode)
return convert_to_mode (tmode, op0, unsignedp);
bitnum + bit_offset, 1, target_part, mode,
word_mode);
- if (target_part == 0)
- abort ();
+ gcc_assert (target_part);
if (result_part != target_part)
emit_move_insn (target_part, result_part);
/* Signed bit field: sign-extend with two arithmetic shifts. */
target = expand_shift (LSHIFT_EXPR, mode, target,
build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode) - bitsize,
- 0),
+ GET_MODE_BITSIZE (mode) - bitsize),
NULL_RTX, 0);
return expand_shift (RSHIFT_EXPR, mode, target,
build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode) - bitsize,
- 0),
+ GET_MODE_BITSIZE (mode) - bitsize),
NULL_RTX, 0);
}
int_mode = int_mode_for_mode (tmode);
if (int_mode == BLKmode)
int_mode = int_mode_for_mode (mode);
- if (int_mode == BLKmode)
- abort (); /* Should probably push op0 out to memory and then
- do a load. */
+ /* Should probably push op0 out to memory and then do a load. */
+ gcc_assert (int_mode != BLKmode);
/* OFFSET is the number of words or bytes (UNIT says which)
from STR_RTX to the first word or byte containing part of the field. */
-
if (!MEM_P (op0))
{
if (offset != 0
return spec_target;
if (GET_MODE (target) != tmode && GET_MODE (target) != mode)
{
- /* If the target mode is floating-point, first convert to the
- integer mode of that size and then access it as a floating-point
- value via a SUBREG. */
- if (GET_MODE_CLASS (tmode) != MODE_INT
- && GET_MODE_CLASS (tmode) != MODE_PARTIAL_INT)
+ /* If the target mode is complex, then extract the two scalar elements
+ from the value now. Creating (subreg:SC (reg:DI) 0), as we would do
+ with the clause below, will cause gen_realpart or gen_imagpart to
+ fail, since those functions must return lvalues. */
+ if (COMPLEX_MODE_P (tmode))
{
+ rtx realpart, imagpart;
+ enum machine_mode itmode = GET_MODE_INNER (tmode);
+
target = convert_to_mode (mode_for_size (GET_MODE_BITSIZE (tmode),
MODE_INT, 0),
target, unsignedp);
+
+ realpart = extract_bit_field (target, GET_MODE_BITSIZE (itmode), 0,
+ unsignedp, NULL, itmode, itmode);
+ imagpart = extract_bit_field (target, GET_MODE_BITSIZE (itmode),
+ GET_MODE_BITSIZE (itmode), unsignedp,
+ NULL, itmode, itmode);
+
+ return gen_rtx_CONCAT (tmode, realpart, imagpart);
+ }
+
+ /* If the target mode is not a scalar integral, first convert to the
+ integer mode of that size and then access it as a floating-point
+ value via a SUBREG. */
+ if (!SCALAR_INT_MODE_P (tmode))
+ {
+ enum machine_mode smode
+ = mode_for_size (GET_MODE_BITSIZE (tmode), MODE_INT, 0);
+ target = convert_to_mode (smode, target, unsignedp);
+ target = force_reg (smode, target);
return gen_lowpart (tmode, target);
}
- else
- return convert_to_mode (tmode, target, unsignedp);
+
+ return convert_to_mode (tmode, target, unsignedp);
}
return target;
}
{
/* If the field does not already start at the lsb,
shift it so it does. */
- tree amount = build_int_cst (NULL_TREE, bitpos, 0);
+ tree amount = build_int_cst (NULL_TREE, bitpos);
/* Maybe propagate the target for the shift. */
/* But not if we will return it--could confuse integrate.c. */
rtx subtarget = (target != 0 && REG_P (target) ? target : 0);
{
tree amount
= build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode) - (bitsize + bitpos), 0);
+ GET_MODE_BITSIZE (mode) - (bitsize + bitpos));
/* Maybe propagate the target for the shift. */
rtx subtarget = (target != 0 && REG_P (target) ? target : 0);
op0 = expand_shift (LSHIFT_EXPR, mode, op0, amount, subtarget, 1);
return expand_shift (RSHIFT_EXPR, mode, op0,
build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode) - bitsize, 0),
+ GET_MODE_BITSIZE (mode) - bitsize),
target, 0);
}
\f
return immed_double_const (low, high, mode);
}
\f
+/* Extract a bit field from a memory by forcing the alignment of the
+ memory. This is efficient only if the field spans at least 4 boundaries.
+
+ OP0 is the MEM.
+ BITSIZE is the field width; BITPOS is the position of the first bit.
+ UNSIGNEDP is true if the result should be zero-extended. */
+
+static rtx
+extract_force_align_mem_bit_field (rtx op0, unsigned HOST_WIDE_INT bitsize,
+ unsigned HOST_WIDE_INT bitpos,
+ int unsignedp)
+{
+ enum machine_mode mode, dmode;
+ unsigned int m_bitsize, m_size;
+ unsigned int sign_shift_up, sign_shift_dn;
+ rtx base, a1, a2, v1, v2, comb, shift, result, start;
+
+ /* Choose a mode that will fit BITSIZE. */
+ mode = smallest_mode_for_size (bitsize, MODE_INT);
+ m_size = GET_MODE_SIZE (mode);
+ m_bitsize = GET_MODE_BITSIZE (mode);
+
+ /* Choose a mode twice as wide. Fail if no such mode exists. */
+ dmode = mode_for_size (m_bitsize * 2, MODE_INT, false);
+ if (dmode == BLKmode)
+ return NULL;
+
+ do_pending_stack_adjust ();
+ start = get_last_insn ();
+
+ /* At the end, we'll need an additional shift to deal with sign/zero
+ extension. By default this will be a left+right shift of the
+ appropriate size. But we may be able to eliminate one of them. */
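+ /* For instance, a signed 5-bit field selects QImode above, giving
+ an up shift and a down shift of 3 bits each. */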
+ sign_shift_up = sign_shift_dn = m_bitsize - bitsize;
+
+ if (STRICT_ALIGNMENT)
+ {
+ base = plus_constant (XEXP (op0, 0), bitpos / BITS_PER_UNIT);
+ bitpos %= BITS_PER_UNIT;
+
+ /* We load two values to be concatenated. There's an edge condition
+ that bears notice -- an aligned value at the end of a page can
+ only load one value lest we segfault. So the two values we load
+ are at "base & -size" and "(base + size - 1) & -size". If base
+ is unaligned, the addresses will be aligned and sequential; if
+ base is aligned, the addresses will both be equal to base. */
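+ /* E.g. with m_size == 4: base == 0x1003 loads from 0x1000 and
+ 0x1004, while an aligned base == 0x1000 loads 0x1000 twice. */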
+
+ a1 = expand_simple_binop (Pmode, AND, force_operand (base, NULL),
+ GEN_INT (-(HOST_WIDE_INT)m_size),
+ NULL, true, OPTAB_LIB_WIDEN);
+ mark_reg_pointer (a1, m_bitsize);
+ v1 = gen_rtx_MEM (mode, a1);
+ set_mem_align (v1, m_bitsize);
+ v1 = force_reg (mode, validize_mem (v1));
+
+ a2 = plus_constant (base, GET_MODE_SIZE (mode) - 1);
+ a2 = expand_simple_binop (Pmode, AND, force_operand (a2, NULL),
+ GEN_INT (-(HOST_WIDE_INT)m_size),
+ NULL, true, OPTAB_LIB_WIDEN);
+ v2 = gen_rtx_MEM (mode, a2);
+ set_mem_align (v2, m_bitsize);
+ v2 = force_reg (mode, validize_mem (v2));
+
+ /* Combine these two values into a double-word value. */
+ if (m_bitsize == BITS_PER_WORD)
+ {
+ comb = gen_reg_rtx (dmode);
+ emit_insn (gen_rtx_CLOBBER (VOIDmode, comb));
+ emit_move_insn (gen_rtx_SUBREG (mode, comb, 0), v1);
+ emit_move_insn (gen_rtx_SUBREG (mode, comb, m_size), v2);
+ }
+ else
+ {
+ if (BYTES_BIG_ENDIAN)
+ comb = v1, v1 = v2, v2 = comb;
+ v1 = convert_modes (dmode, mode, v1, true);
+ if (v1 == NULL)
+ goto fail;
+ v2 = convert_modes (dmode, mode, v2, true);
+ v2 = expand_simple_binop (dmode, ASHIFT, v2, GEN_INT (m_bitsize),
+ NULL, true, OPTAB_LIB_WIDEN);
+ if (v2 == NULL)
+ goto fail;
+ comb = expand_simple_binop (dmode, IOR, v1, v2, NULL,
+ true, OPTAB_LIB_WIDEN);
+ if (comb == NULL)
+ goto fail;
+ }
+
+ shift = expand_simple_binop (Pmode, AND, base, GEN_INT (m_size - 1),
+ NULL, true, OPTAB_LIB_WIDEN);
+ shift = expand_mult (Pmode, shift, GEN_INT (BITS_PER_UNIT), NULL, 1);
+
+ if (bitpos != 0)
+ {
+ if (sign_shift_up <= bitpos)
+ bitpos -= sign_shift_up, sign_shift_up = 0;
+ shift = expand_simple_binop (Pmode, PLUS, shift, GEN_INT (bitpos),
+ NULL, true, OPTAB_LIB_WIDEN);
+ }
+ }
+ else
+ {
+ unsigned HOST_WIDE_INT offset = bitpos / BITS_PER_UNIT;
+ bitpos %= BITS_PER_UNIT;
+
+ /* When strict alignment is not required, we can just load directly
+ from memory without masking. If the remaining BITPOS offset is
+ small enough, we may be able to do all operations in MODE as
+ opposed to DMODE. */
+ if (bitpos + bitsize <= m_bitsize)
+ dmode = mode;
+ comb = adjust_address (op0, dmode, offset);
+
+ if (sign_shift_up <= bitpos)
+ bitpos -= sign_shift_up, sign_shift_up = 0;
+ shift = GEN_INT (bitpos);
+ }
+
+ /* Shift down the double-word such that the requested value is at bit 0. */
+ if (shift != const0_rtx)
+ comb = expand_simple_binop (dmode, unsignedp ? LSHIFTRT : ASHIFTRT,
+ comb, shift, NULL, unsignedp, OPTAB_LIB_WIDEN);
+ if (comb == NULL)
+ goto fail;
+
+ /* If the field exactly matches MODE, then all we need to do is return the
+ lowpart. Otherwise, shift to get the sign bits set properly. */
+ result = force_reg (mode, gen_lowpart (mode, comb));
+
+ if (sign_shift_up)
+ result = expand_simple_binop (mode, ASHIFT, result,
+ GEN_INT (sign_shift_up),
+ NULL_RTX, 0, OPTAB_LIB_WIDEN);
+ if (sign_shift_dn)
+ result = expand_simple_binop (mode, unsignedp ? LSHIFTRT : ASHIFTRT,
+ result, GEN_INT (sign_shift_dn),
+ NULL_RTX, 0, OPTAB_LIB_WIDEN);
+
+ return result;
+
+ fail:
+ delete_insns_since (start);
+ return NULL;
+}
+
/* Extract a bit field that is split across two words
and return an RTX for the result.
if (REG_P (op0) || GET_CODE (op0) == SUBREG)
unit = BITS_PER_WORD;
else
- unit = MIN (MEM_ALIGN (op0), BITS_PER_WORD);
+ {
+ unit = MIN (MEM_ALIGN (op0), BITS_PER_WORD);
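+ /* ??? The "0 &&" below deliberately disables this path for now. */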
+ if (0 && bitsize / unit > 2)
+ {
+ rtx tmp = extract_force_align_mem_bit_field (op0, bitsize, bitpos,
+ unsignedp);
+ if (tmp)
+ return tmp;
+ }
+ }
while (bitsdone < bitsize)
{
{
if (bitsize != bitsdone)
part = expand_shift (LSHIFT_EXPR, word_mode, part,
- build_int_cst (NULL_TREE,
- bitsize - bitsdone, 0), 0, 1);
+ build_int_cst (NULL_TREE, bitsize - bitsdone),
+ 0, 1);
}
else
{
if (bitsdone != thissize)
part = expand_shift (LSHIFT_EXPR, word_mode, part,
build_int_cst (NULL_TREE,
- bitsdone - thissize, 0), 0, 1);
+ bitsdone - thissize), 0, 1);
}
if (first)
return result;
/* Signed bit field: sign-extend with two arithmetic shifts. */
result = expand_shift (LSHIFT_EXPR, word_mode, result,
- build_int_cst (NULL_TREE,
- BITS_PER_WORD - bitsize, 0),
+ build_int_cst (NULL_TREE, BITS_PER_WORD - bitsize),
NULL_RTX, 0);
return expand_shift (RSHIFT_EXPR, word_mode, result,
- build_int_cst (NULL_TREE,
- BITS_PER_WORD - bitsize, 0), NULL_RTX, 0);
+ build_int_cst (NULL_TREE, BITS_PER_WORD - bitsize),
+ NULL_RTX, 0);
}
\f
/* Add INC into TARGET. */
tree other_amount
= fold (build2 (MINUS_EXPR, type, convert
(type, build_int_cst
- (NULL_TREE, GET_MODE_BITSIZE (mode), 0)),
+ (NULL_TREE, GET_MODE_BITSIZE (mode))),
amount));
shifted = force_reg (mode, shifted);
define_expand for lshrsi3 was added to vax.md. */
}
- if (temp == 0)
- abort ();
+ gcc_assert (temp);
return temp;
}
\f
-enum alg_code { alg_zero, alg_m, alg_shift,
+enum alg_code { alg_unknown, alg_zero, alg_m, alg_shift,
alg_add_t_m2, alg_sub_t_m2,
alg_add_factor, alg_sub_factor,
- alg_add_t2_m, alg_sub_t2_m,
- alg_add, alg_subtract, alg_factor, alg_shiftop };
+ alg_add_t2_m, alg_sub_t2_m };
+
+/* This structure holds the "cost" of a multiply sequence. The
+ "cost" field holds the total rtx_cost of every operator in the
+ synthetic multiplication sequence, hence cost(a op b) is defined
+ as rtx_cost(op) + cost(a) + cost(b), where cost(leaf) is zero.
+ The "latency" field holds the minimum possible latency of the
+ synthetic multiply, on a hypothetical infinitely parallel CPU.
+ This is the critical path, or the maximum height, of the expression
+ tree which is the sum of rtx_costs on the most expensive path from
+ any leaf to the root. Hence latency(a op b) is defined as zero for
+ leaves and rtx_cost(op) + max(latency(a), latency(b)) otherwise. */
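+
+/* For example, with a uniform rtx_cost of 4 per operation, the tree
+ (a + b) + (c + d) has cost 12 (three operations) but latency 8,
+ since the two inner additions can execute in parallel. */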
+
+struct mult_cost {
+ short cost; /* Total rtx_cost of the multiplication sequence. */
+ short latency; /* The latency of the multiplication sequence. */
+};
+
+/* This macro is used to compare a pointer to a mult_cost against an
+ single integer "rtx_cost" value. This is equivalent to the macro
+ CHEAPER_MULT_COST(X,Z) where Z = {Y,Y}. */
+#define MULT_COST_LESS(X,Y) ((X)->cost < (Y) \
+ || ((X)->cost == (Y) && (X)->latency < (Y)))
+
+/* This macro is used to compare two pointers to mult_costs against
+ each other. The macro returns true if X is cheaper than Y.
+ Currently, the cheaper of two mult_costs is the one with the
+ lower "cost". If "cost"s are tied, the lower latency is cheaper. */
+#define CHEAPER_MULT_COST(X,Y) ((X)->cost < (Y)->cost \
+ || ((X)->cost == (Y)->cost \
+ && (X)->latency < (Y)->latency))
/* This structure records a sequence of operations.
`ops' is the number of operations recorded.
struct algorithm
{
- short cost;
+ struct mult_cost cost;
short ops;
/* The size of the OP and LOG fields are not directly related to the
word size, but the worst-case algorithms will be if we have few
char log[MAX_BITS_PER_WORD];
};
+/* The entry for our multiplication cache/hash table. */
+struct alg_hash_entry {
+ /* The number we are multiplying by. */
+ unsigned int t;
+
+ /* The mode in which we are multiplying something by T. */
+ enum machine_mode mode;
+
+ /* The best multiplication algorithm for t. */
+ enum alg_code alg;
+};
+
+/* The number of cache/hash entries. */
+#define NUM_ALG_HASH_ENTRIES 307
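+/* (307 is prime, which presumably helps the simple XOR/mod hash
+ below spread entries evenly.) */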
+
+/* Each entry of ALG_HASH caches alg_code for some integer. This is
+ actually a hash table. If we have a collision, the older
+ entry is kicked out. */
+static struct alg_hash_entry alg_hash[NUM_ALG_HASH_ENTRIES];
+
/* Indicates the type of fixup needed after a constant multiplication.
BASIC_VARIANT means no fixup is needed, NEGATE_VARIANT means that
the result should be negated, and ADD_VARIANT means that the
enum mult_variant {basic_variant, negate_variant, add_variant};
static void synth_mult (struct algorithm *, unsigned HOST_WIDE_INT,
- int, enum machine_mode mode);
+ const struct mult_cost *, enum machine_mode mode);
static bool choose_mult_variant (enum machine_mode, HOST_WIDE_INT,
struct algorithm *, enum mult_variant *, int);
static rtx expand_mult_const (enum machine_mode, rtx, HOST_WIDE_INT, rtx,
static void
synth_mult (struct algorithm *alg_out, unsigned HOST_WIDE_INT t,
- int cost_limit, enum machine_mode mode)
+ const struct mult_cost *cost_limit, enum machine_mode mode)
{
int m;
struct algorithm *alg_in, *best_alg;
- int cost;
+ struct mult_cost best_cost;
+ struct mult_cost new_limit;
+ int op_cost, op_latency;
unsigned HOST_WIDE_INT q;
int maxm = MIN (BITS_PER_WORD, GET_MODE_BITSIZE (mode));
+ int hash_index;
+ bool cache_hit = false;
+ enum alg_code cache_alg = alg_zero;
/* Indicate that no algorithm is yet found. If no algorithm
is found, this value will be returned and indicate failure. */
- alg_out->cost = cost_limit;
+ alg_out->cost.cost = cost_limit->cost + 1;
+ alg_out->cost.latency = cost_limit->latency + 1;
- if (cost_limit <= 0)
+ if (cost_limit->cost < 0
+ || (cost_limit->cost == 0 && cost_limit->latency <= 0))
return;
/* Restrict the bits of "t" to the multiplication's mode. */
if (t == 1)
{
alg_out->ops = 1;
- alg_out->cost = 0;
+ alg_out->cost.cost = 0;
+ alg_out->cost.latency = 0;
alg_out->op[0] = alg_m;
return;
}
fail now. */
if (t == 0)
{
- if (zero_cost >= cost_limit)
+ if (MULT_COST_LESS (cost_limit, zero_cost))
return;
else
{
alg_out->ops = 1;
- alg_out->cost = zero_cost;
+ alg_out->cost.cost = zero_cost;
+ alg_out->cost.latency = zero_cost;
alg_out->op[0] = alg_zero;
return;
}
alg_in = alloca (sizeof (struct algorithm));
best_alg = alloca (sizeof (struct algorithm));
+ best_cost = *cost_limit;
+
+ /* Compute the hash index. */
+ hash_index = (t ^ (unsigned int) mode) % NUM_ALG_HASH_ENTRIES;
+
+ /* See if we already know what to do for T. */
+ if (alg_hash[hash_index].t == t
+ && alg_hash[hash_index].mode == mode
+ && alg_hash[hash_index].alg != alg_unknown)
+ {
+ cache_hit = true;
+ cache_alg = alg_hash[hash_index].alg;
+ switch (cache_alg)
+ {
+ case alg_shift:
+ goto do_alg_shift;
+
+ case alg_add_t_m2:
+ case alg_sub_t_m2:
+ goto do_alg_addsub_t_m2;
+
+ case alg_add_factor:
+ case alg_sub_factor:
+ goto do_alg_addsub_factor;
+
+ case alg_add_t2_m:
+ goto do_alg_add_t2_m;
+
+ case alg_sub_t2_m:
+ goto do_alg_sub_t2_m;
+
+ default:
+ gcc_unreachable ();
+ }
+ }
/* If we have a group of zero bits at the low-order part of T, try
multiplying by the remaining bits and then doing a shift. */
if ((t & 1) == 0)
{
+ do_alg_shift:
m = floor_log2 (t & -t); /* m = number of low zero bits */
if (m < maxm)
{
/* The function expand_shift will choose between a shift and
a sequence of additions, so the observed cost is given as
MIN (m * add_cost[mode], shift_cost[mode][m]). */
- cost = m * add_cost[mode];
- if (shift_cost[mode][m] < cost)
- cost = shift_cost[mode][m];
- synth_mult (alg_in, q, cost_limit - cost, mode);
-
- cost += alg_in->cost;
- if (cost < cost_limit)
+ op_cost = m * add_cost[mode];
+ if (shift_cost[mode][m] < op_cost)
+ op_cost = shift_cost[mode][m];
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_cost;
+ synth_mult (alg_in, q, &new_limit, mode);
+
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = m;
best_alg->op[best_alg->ops] = alg_shift;
- cost_limit = cost;
}
}
+ if (cache_hit)
+ goto done;
}
/* If we have an odd number, add or subtract one. */
{
unsigned HOST_WIDE_INT w;
+ do_alg_addsub_t_m2:
for (w = 1; (w & t) != 0; w <<= 1)
;
/* If T was -1, then W will be zero after the loop. This is another
{
/* T ends with ...111. Multiply by (T + 1) and subtract 1. */
- cost = add_cost[mode];
- synth_mult (alg_in, t + 1, cost_limit - cost, mode);
+ op_cost = add_cost[mode];
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_cost;
+ synth_mult (alg_in, t + 1, &new_limit, mode);
- cost += alg_in->cost;
- if (cost < cost_limit)
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = 0;
best_alg->op[best_alg->ops] = alg_sub_t_m2;
- cost_limit = cost;
}
}
else
{
/* T ends with ...01 or ...011. Multiply by (T - 1) and add 1. */
- cost = add_cost[mode];
- synth_mult (alg_in, t - 1, cost_limit - cost, mode);
+ op_cost = add_cost[mode];
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_cost;
+ synth_mult (alg_in, t - 1, &new_limit, mode);
- cost += alg_in->cost;
- if (cost < cost_limit)
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = 0;
best_alg->op[best_alg->ops] = alg_add_t_m2;
- cost_limit = cost;
}
}
+ if (cache_hit)
+ goto done;
}
/* Look for factors of t of the form
good sequence quickly, and therefore be able to prune (by decreasing
COST_LIMIT) the search. */
+ do_alg_addsub_factor:
for (m = floor_log2 (t - 1); m >= 2; m--)
{
unsigned HOST_WIDE_INT d;
d = ((unsigned HOST_WIDE_INT) 1 << m) + 1;
- if (t % d == 0 && t > d && m < maxm)
+ if (t % d == 0 && t > d && m < maxm
+ && (!cache_hit || cache_alg == alg_add_factor))
{
- cost = add_cost[mode] + shift_cost[mode][m];
- if (shiftadd_cost[mode][m] < cost)
- cost = shiftadd_cost[mode][m];
- synth_mult (alg_in, t / d, cost_limit - cost, mode);
+ /* If the target has a cheap shift-and-add instruction use
+ that in preference to a shift insn followed by an add insn.
+ Assume that the shift-and-add is "atomic" with a latency
+ equal to its cost, otherwise assume that on superscalar
+ hardware the shift may be executed concurrently with the
+ earlier steps in the algorithm. */
+ op_cost = add_cost[mode] + shift_cost[mode][m];
+ if (shiftadd_cost[mode][m] < op_cost)
+ {
+ op_cost = shiftadd_cost[mode][m];
+ op_latency = op_cost;
+ }
+ else
+ op_latency = add_cost[mode];
+
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_latency;
+ synth_mult (alg_in, t / d, &new_limit, mode);
- cost += alg_in->cost;
- if (cost < cost_limit)
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_latency;
+ if (alg_in->cost.latency < op_cost)
+ alg_in->cost.latency = op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = m;
best_alg->op[best_alg->ops] = alg_add_factor;
- cost_limit = cost;
}
/* Other factors will have been taken care of in the recursion. */
break;
}
d = ((unsigned HOST_WIDE_INT) 1 << m) - 1;
- if (t % d == 0 && t > d && m < maxm)
+ if (t % d == 0 && t > d && m < maxm
+ && (!cache_hit || cache_alg == alg_sub_factor))
{
- cost = add_cost[mode] + shift_cost[mode][m];
- if (shiftsub_cost[mode][m] < cost)
- cost = shiftsub_cost[mode][m];
- synth_mult (alg_in, t / d, cost_limit - cost, mode);
+ /* If the target has a cheap shift-and-subtract insn use
+ that in preference to a shift insn followed by a sub insn.
+ Assume that the shift-and-sub is "atomic" with a latency
+ equal to its cost, otherwise assume that on superscalar
+ hardware the shift may be executed concurrently with the
+ earlier steps in the algorithm. */
+ op_cost = add_cost[mode] + shift_cost[mode][m];
+ if (shiftsub_cost[mode][m] < op_cost)
+ {
+ op_cost = shiftsub_cost[mode][m];
+ op_latency = op_cost;
+ }
+ else
+ op_latency = add_cost[mode];
+
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_latency;
+ synth_mult (alg_in, t / d, &new_limit, mode);
- cost += alg_in->cost;
- if (cost < cost_limit)
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_latency;
+ if (alg_in->cost.latency < op_cost)
+ alg_in->cost.latency = op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = m;
best_alg->op[best_alg->ops] = alg_sub_factor;
- cost_limit = cost;
}
break;
}
}
+ if (cache_hit)
+ goto done;
/* Try shift-and-add (load effective address) instructions,
i.e. do a*3, a*5, a*9. */
if ((t & 1) != 0)
{
+ do_alg_add_t2_m:
q = t - 1;
q = q & -q;
m = exact_log2 (q);
if (m >= 0 && m < maxm)
{
- cost = shiftadd_cost[mode][m];
- synth_mult (alg_in, (t - 1) >> m, cost_limit - cost, mode);
-
- cost += alg_in->cost;
- if (cost < cost_limit)
+ op_cost = shiftadd_cost[mode][m];
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_cost;
+ synth_mult (alg_in, (t - 1) >> m, &new_limit, mode);
+
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = m;
best_alg->op[best_alg->ops] = alg_add_t2_m;
- cost_limit = cost;
}
}
+ if (cache_hit)
+ goto done;
+ do_alg_sub_t2_m:
q = t + 1;
q = q & -q;
m = exact_log2 (q);
if (m >= 0 && m < maxm)
{
- cost = shiftsub_cost[mode][m];
- synth_mult (alg_in, (t + 1) >> m, cost_limit - cost, mode);
-
- cost += alg_in->cost;
- if (cost < cost_limit)
+ op_cost = shiftsub_cost[mode][m];
+ new_limit.cost = best_cost.cost - op_cost;
+ new_limit.latency = best_cost.latency - op_cost;
+ synth_mult (alg_in, (t + 1) >> m, &new_limit, mode);
+
+ alg_in->cost.cost += op_cost;
+ alg_in->cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg_in->cost, &best_cost))
{
struct algorithm *x;
+ best_cost = alg_in->cost;
x = alg_in, alg_in = best_alg, best_alg = x;
best_alg->log[best_alg->ops] = m;
best_alg->op[best_alg->ops] = alg_sub_t2_m;
- cost_limit = cost;
}
}
+ if (cache_hit)
+ goto done;
}
- /* If cost_limit has not decreased since we stored it in alg_out->cost,
- we have not found any algorithm. */
- if (cost_limit == alg_out->cost)
+ done:
+ /* If best_cost has not decreased, we have not found any algorithm. */
+ if (!CHEAPER_MULT_COST (&best_cost, cost_limit))
return;
+ /* Cache the result. */
+ if (!cache_hit)
+ {
+ alg_hash[hash_index].t = t;
+ alg_hash[hash_index].mode = mode;
+ alg_hash[hash_index].alg = best_alg->op[best_alg->ops];
+ }
+
/* If we are getting a too long sequence for `struct algorithm'
to record, make this search fail. */
if (best_alg->ops == MAX_BITS_PER_WORD)
We avoid using structure assignment because the majority of
best_alg is normally undefined, and this is a critical function. */
alg_out->ops = best_alg->ops + 1;
- alg_out->cost = cost_limit;
+ alg_out->cost = best_cost;
memcpy (alg_out->op, best_alg->op,
alg_out->ops * sizeof *alg_out->op);
memcpy (alg_out->log, best_alg->log,
int mult_cost)
{
struct algorithm alg2;
+ struct mult_cost limit;
+ int op_cost;
*variant = basic_variant;
- synth_mult (alg, val, mult_cost, mode);
+ limit.cost = mult_cost;
+ limit.latency = mult_cost;
+ synth_mult (alg, val, &limit, mode);
/* This works only if the inverted value actually fits in an
`unsigned int' */
if (HOST_BITS_PER_INT >= GET_MODE_BITSIZE (mode))
{
- synth_mult (&alg2, -val, MIN (alg->cost, mult_cost) - neg_cost[mode],
- mode);
- alg2.cost += neg_cost[mode];
- if (alg2.cost < alg->cost)
+ op_cost = neg_cost[mode];
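+ /* The negated sequence, including the final negation, must beat
+ whichever bound is tighter: the algorithm already found or the
+ caller's original cost limit. */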
+ if (MULT_COST_LESS (&alg->cost, mult_cost))
+ {
+ limit.cost = alg->cost.cost - op_cost;
+ limit.latency = alg->cost.latency - op_cost;
+ }
+ else
+ {
+ limit.cost = mult_cost - op_cost;
+ limit.latency = mult_cost - op_cost;
+ }
+
+ synth_mult (&alg2, -val, &limit, mode);
+ alg2.cost.cost += op_cost;
+ alg2.cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg2.cost, &alg->cost))
*alg = alg2, *variant = negate_variant;
}
/* This proves very useful for division-by-constant. */
- synth_mult (&alg2, val - 1, MIN (alg->cost, mult_cost) - add_cost[mode],
- mode);
- alg2.cost += add_cost[mode];
- if (alg2.cost < alg->cost)
+ op_cost = add_cost[mode];
+ if (MULT_COST_LESS (&alg->cost, mult_cost))
+ {
+ limit.cost = alg->cost.cost - op_cost;
+ limit.latency = alg->cost.latency - op_cost;
+ }
+ else
+ {
+ limit.cost = mult_cost - op_cost;
+ limit.latency = mult_cost - op_cost;
+ }
+
+ synth_mult (&alg2, val - 1, &limit, mode);
+ alg2.cost.cost += op_cost;
+ alg2.cost.latency += op_cost;
+ if (CHEAPER_MULT_COST (&alg2.cost, &alg->cost))
*alg = alg2, *variant = add_variant;
- return alg->cost < mult_cost;
+ return MULT_COST_LESS (&alg->cost, mult_cost);
}
/* A subroutine of expand_mult, used for constant multiplications.
val_so_far = 1;
}
else
- abort ();
+ gcc_unreachable ();
for (opno = 1; opno < alg->ops; opno++)
{
{
case alg_shift:
accum = expand_shift (LSHIFT_EXPR, mode, accum,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
NULL_RTX, 0);
val_so_far <<= log;
break;
case alg_add_t_m2:
tem = expand_shift (LSHIFT_EXPR, mode, op0,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
NULL_RTX, 0);
accum = force_operand (gen_rtx_PLUS (mode, accum, tem),
add_target ? add_target : accum_target);
case alg_sub_t_m2:
tem = expand_shift (LSHIFT_EXPR, mode, op0,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
NULL_RTX, 0);
accum = force_operand (gen_rtx_MINUS (mode, accum, tem),
add_target ? add_target : accum_target);
case alg_add_t2_m:
accum = expand_shift (LSHIFT_EXPR, mode, accum,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
shift_subtarget,
0);
accum = force_operand (gen_rtx_PLUS (mode, accum, op0),
case alg_sub_t2_m:
accum = expand_shift (LSHIFT_EXPR, mode, accum,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
shift_subtarget, 0);
accum = force_operand (gen_rtx_MINUS (mode, accum, op0),
add_target ? add_target : accum_target);
case alg_add_factor:
tem = expand_shift (LSHIFT_EXPR, mode, accum,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
NULL_RTX, 0);
accum = force_operand (gen_rtx_PLUS (mode, accum, tem),
add_target ? add_target : accum_target);
case alg_sub_factor:
tem = expand_shift (LSHIFT_EXPR, mode, accum,
- build_int_cst (NULL_TREE, log, 0),
+ build_int_cst (NULL_TREE, log),
NULL_RTX, 0);
accum = force_operand (gen_rtx_MINUS (mode, tem, accum),
(add_target
break;
default:
- abort ();
+ gcc_unreachable ();
}
/* Write a REG_EQUAL note on the last insn so that we can cse
in the result mode, to avoid sign-/zero-extension confusion. */
val &= GET_MODE_MASK (mode);
val_so_far &= GET_MODE_MASK (mode);
- if (val != val_so_far)
- abort ();
+ gcc_assert (val == val_so_far);
return accum;
}
&& flag_trapv && (GET_MODE_CLASS(mode) == MODE_INT)
? smulv_optab : smul_optab,
op0, op1, target, unsignedp, OPTAB_LIB_WIDEN);
- if (op0 == 0)
- abort ();
+ gcc_assert (op0);
return op0;
}
\f
/* lgup = ceil(log2(divisor)); */
lgup = ceil_log2 (d);
- if (lgup > n)
- abort ();
+ gcc_assert (lgup <= n);
pow = n + lgup;
pow2 = n + lgup - precision;
- if (pow == 2 * HOST_BITS_PER_WIDE_INT)
- {
- /* We could handle this with some effort, but this case is much better
- handled directly with a scc insn, so rely on caller using that. */
- abort ();
- }
+ /* We could handle this with some effort, but this case is much
+ better handled directly with a scc insn, so rely on caller using
+ that. */
+ gcc_assert (pow != 2 * HOST_BITS_PER_WIDE_INT);
/* mlow = 2^(N + lgup)/d */
if (pow >= HOST_BITS_PER_WIDE_INT)
div_and_round_double (TRUNC_DIV_EXPR, 1, nl, nh, d, (HOST_WIDE_INT) 0,
&mhigh_lo, &mhigh_hi, &dummy1, &dummy2);
- if (mhigh_hi && nh - d >= d)
- abort ();
- if (mhigh_hi > 1 || mlow_hi > 1)
- abort ();
+ gcc_assert (!mhigh_hi || nh - d < d);
+ gcc_assert (mhigh_hi <= 1 && mlow_hi <= 1);
/* Assert that mlow < mhigh. */
- if (! (mlow_hi < mhigh_hi || (mlow_hi == mhigh_hi && mlow_lo < mhigh_lo)))
- abort ();
+ gcc_assert (mlow_hi < mhigh_hi
+ || (mlow_hi == mhigh_hi && mlow_lo < mhigh_lo));
/* If precision == N, then mlow, mhigh exceed 2^N
(but they do not exceed 2^(N+1)). */
enum rtx_code adj_code = unsignedp ? PLUS : MINUS;
tem = expand_shift (RSHIFT_EXPR, mode, op0,
- build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode) - 1, 0),
+ build_int_cst (NULL_TREE, GET_MODE_BITSIZE (mode) - 1),
NULL_RTX, 0);
tem = expand_and (mode, tem, op1, NULL_RTX);
adj_operand
adj_operand);
tem = expand_shift (RSHIFT_EXPR, mode, op1,
- build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode) - 1, 0),
+ build_int_cst (NULL_TREE, GET_MODE_BITSIZE (mode) - 1),
NULL_RTX, 0);
tem = expand_and (mode, tem, op0, NULL_RTX);
target = force_operand (gen_rtx_fmt_ee (adj_code, mode, adj_operand, tem),
wider_mode = GET_MODE_WIDER_MODE (mode);
op = expand_shift (RSHIFT_EXPR, wider_mode, op,
- build_int_cst (NULL_TREE,
- GET_MODE_BITSIZE (mode), 0), 0, 1);
+ build_int_cst (NULL_TREE, GET_MODE_BITSIZE (mode)), 0, 1);
return convert_modes (mode, wider_mode, op, 0);
}
rtx op1, tem;
/* We can't support modes wider than HOST_BITS_PER_INT. */
- if (GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT)
- abort ();
+ gcc_assert (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT);
op1 = gen_int_mode (cnst1, wider_mode);
cnst1 &= GET_MODE_MASK (mode);
{
/* See whether the specialized multiplication optabs are
cheaper than the shift/add version. */
- tem = expand_mult_highpart_optab (mode, op0, op1, target,
- unsignedp, alg.cost + extra_cost);
+ tem = expand_mult_highpart_optab (mode, op0, op1, target, unsignedp,
+ alg.cost.cost + extra_cost);
if (tem)
return tem;
static rtx
expand_smod_pow2 (enum machine_mode mode, rtx op0, HOST_WIDE_INT d)
{
- unsigned HOST_WIDE_INT mask;
+ unsigned HOST_WIDE_INT masklow, maskhigh;
rtx result, temp, shift, label;
int logd;
if (signmask)
{
signmask = force_reg (mode, signmask);
- mask = ((HOST_WIDE_INT) 1 << logd) - 1;
+ masklow = ((HOST_WIDE_INT) 1 << logd) - 1;
shift = GEN_INT (GET_MODE_BITSIZE (mode) - logd);
/* Use the rtx_cost of a LSHIFTRT instruction to determine
which instruction sequence to use. If logical right shifts
are expensive the use 2 XORs, 2 SUBs and an AND, otherwise
use a LSHIFTRT, 1 ADD, 1 SUB and an AND. */
-
+
temp = gen_rtx_LSHIFTRT (mode, result, shift);
if (lshr_optab->handlers[mode].insn_code == CODE_FOR_nothing
|| rtx_cost (temp, SET) > COSTS_N_INSNS (2))
NULL_RTX, 1, OPTAB_LIB_WIDEN);
temp = expand_binop (mode, sub_optab, temp, signmask,
NULL_RTX, 1, OPTAB_LIB_WIDEN);
- temp = expand_binop (mode, and_optab, temp, GEN_INT (mask),
+ temp = expand_binop (mode, and_optab, temp, GEN_INT (masklow),
NULL_RTX, 1, OPTAB_LIB_WIDEN);
temp = expand_binop (mode, xor_optab, temp, signmask,
NULL_RTX, 1, OPTAB_LIB_WIDEN);
temp = expand_binop (mode, add_optab, op0, signmask,
NULL_RTX, 1, OPTAB_LIB_WIDEN);
- temp = expand_binop (mode, and_optab, temp, GEN_INT (mask),
+ temp = expand_binop (mode, and_optab, temp, GEN_INT (masklow),
NULL_RTX, 1, OPTAB_LIB_WIDEN);
temp = expand_binop (mode, sub_optab, temp, signmask,
NULL_RTX, 1, OPTAB_LIB_WIDEN);
can avoid an explicit compare operation in the following comparison
against zero. */
- mask = (HOST_WIDE_INT) -1 << (GET_MODE_BITSIZE (mode) - 1)
- | (((HOST_WIDE_INT) 1 << logd) - 1);
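+ /* Build a mask with the mode's sign bit and the low LOGD bits set;
+ immed_double_const lets this work even when the mode is wider
+ than a host word. */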
+ masklow = ((HOST_WIDE_INT) 1 << logd) - 1;
+ if (GET_MODE_BITSIZE (mode) <= HOST_BITS_PER_WIDE_INT)
+ {
+ masklow |= (HOST_WIDE_INT) -1 << (GET_MODE_BITSIZE (mode) - 1);
+ maskhigh = -1;
+ }
+ else
+ maskhigh = (HOST_WIDE_INT) -1
+ << (GET_MODE_BITSIZE (mode) - HOST_BITS_PER_WIDE_INT - 1);
- temp = expand_binop (mode, and_optab, op0, GEN_INT (mask), result,
- 1, OPTAB_LIB_WIDEN);
+ temp = expand_binop (mode, and_optab, op0,
+ immed_double_const (masklow, maskhigh, mode),
+ result, 1, OPTAB_LIB_WIDEN);
if (temp != result)
emit_move_insn (result, temp);
temp = expand_binop (mode, sub_optab, result, const1_rtx, result,
0, OPTAB_LIB_WIDEN);
- mask = (HOST_WIDE_INT) -1 << logd;
- temp = expand_binop (mode, ior_optab, temp, GEN_INT (mask), result,
- 1, OPTAB_LIB_WIDEN);
+ masklow = (HOST_WIDE_INT) -1 << logd;
+ maskhigh = -1;
+ temp = expand_binop (mode, ior_optab, temp,
+ immed_double_const (masklow, maskhigh, mode),
+ result, 1, OPTAB_LIB_WIDEN);
temp = expand_binop (mode, add_optab, temp, const1_rtx, result,
0, OPTAB_LIB_WIDEN);
if (temp != result)
int logd;
logd = floor_log2 (d);
- shift = build_int_cst (NULL_TREE, logd, 0);
+ shift = build_int_cst (NULL_TREE, logd);
if (d == 2 && BRANCH_COST >= 1)
{
{
rtx temp2;
+ /* ??? emit_conditional_move forces a stack adjustment via
+ compare_from_rtx so, if the sequence is discarded, it will
+ be lost. Do it now instead. */
+ do_pending_stack_adjust ();
+
start_sequence ();
temp2 = copy_to_mode_reg (mode, op0);
temp = expand_binop (mode, add_optab, temp2, GEN_INT (d-1),
NULL_RTX, 0, OPTAB_LIB_WIDEN);
else
temp = expand_shift (RSHIFT_EXPR, mode, temp,
- build_int_cst (NULL_TREE, ushift, 0),
+ build_int_cst (NULL_TREE, ushift),
NULL_RTX, 1);
temp = expand_binop (mode, add_optab, temp, op0, NULL_RTX,
0, OPTAB_LIB_WIDEN);
}
quotient = expand_shift (RSHIFT_EXPR, compute_mode, op0,
build_int_cst (NULL_TREE,
- pre_shift, 0),
+ pre_shift),
tquotient, 1);
}
else if (size <= HOST_BITS_PER_WIDE_INT)
mh = choose_multiplier (d >> pre_shift, size,
size - pre_shift,
&ml, &post_shift, &dummy);
- if (mh)
- abort ();
+ gcc_assert (!mh);
}
else
pre_shift = 0;
NULL_RTX);
t3 = expand_shift
(RSHIFT_EXPR, compute_mode, t2,
- build_int_cst (NULL_TREE, 1, 0),
+ build_int_cst (NULL_TREE, 1),
NULL_RTX,1);
t4 = force_operand (gen_rtx_PLUS (compute_mode,
t1, t3),
NULL_RTX);
quotient = expand_shift
(RSHIFT_EXPR, compute_mode, t4,
- build_int_cst (NULL_TREE,
- post_shift - 1, 0),
+ build_int_cst (NULL_TREE, post_shift - 1),
tquotient, 1);
}
else
t1 = expand_shift
(RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE, pre_shift, 0),
+ build_int_cst (NULL_TREE, pre_shift),
NULL_RTX, 1);
extra_cost
= (shift_cost[compute_mode][pre_shift]
goto fail1;
quotient = expand_shift
(RSHIFT_EXPR, compute_mode, t2,
- build_int_cst (NULL_TREE,
- post_shift, 0),
+ build_int_cst (NULL_TREE, post_shift),
tquotient, 1);
}
}
if (remainder)
return gen_lowpart (mode, remainder);
}
- quotient = expand_sdiv_pow2 (compute_mode, op0, abs_d);
+
+ if (sdiv_pow2_cheap[compute_mode]
+ && ((sdiv_optab->handlers[compute_mode].insn_code
+ != CODE_FOR_nothing)
+ || (sdivmod_optab->handlers[compute_mode].insn_code
+ != CODE_FOR_nothing)))
+ quotient = expand_divmod (0, TRUNC_DIV_EXPR,
+ compute_mode, op0,
+ gen_int_mode (abs_d,
+ compute_mode),
+ NULL_RTX, 0);
+ else
+ quotient = expand_sdiv_pow2 (compute_mode, op0, abs_d);
/* We have computed OP0 / abs(OP1). If OP1 is negative,
negate the quotient. */
goto fail1;
t2 = expand_shift
(RSHIFT_EXPR, compute_mode, t1,
- build_int_cst (NULL_TREE, post_shift, 0),
+ build_int_cst (NULL_TREE, post_shift),
NULL_RTX, 0);
t3 = expand_shift
(RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE, size - 1, 0),
+ build_int_cst (NULL_TREE, size - 1),
NULL_RTX, 0);
if (d < 0)
quotient
NULL_RTX);
t3 = expand_shift
(RSHIFT_EXPR, compute_mode, t2,
- build_int_cst (NULL_TREE, post_shift, 0),
+ build_int_cst (NULL_TREE, post_shift),
NULL_RTX, 0);
t4 = expand_shift
(RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE, size - 1, 0),
+ build_int_cst (NULL_TREE, size - 1),
NULL_RTX, 0);
if (d < 0)
quotient
}
quotient = expand_shift
(RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE, pre_shift, 0),
+ build_int_cst (NULL_TREE, pre_shift),
tquotient, 0);
}
else
mh = choose_multiplier (d, size, size - 1,
&ml, &post_shift, &lgup);
- if (mh)
- abort ();
+ gcc_assert (!mh);
if (post_shift < BITS_PER_WORD
&& size - 1 < BITS_PER_WORD)
{
t1 = expand_shift
(RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE, size - 1, 0),
+ build_int_cst (NULL_TREE, size - 1),
NULL_RTX, 0);
t2 = expand_binop (compute_mode, xor_optab, op0, t1,
NULL_RTX, 0, OPTAB_WIDEN);
{
t4 = expand_shift
(RSHIFT_EXPR, compute_mode, t3,
- build_int_cst (NULL_TREE, post_shift, 0),
+ build_int_cst (NULL_TREE, post_shift),
NULL_RTX, 1);
quotient = expand_binop (compute_mode, xor_optab,
t4, t1, tquotient, 0,
0, OPTAB_WIDEN);
nsign = expand_shift
(RSHIFT_EXPR, compute_mode, t2,
- build_int_cst (NULL_TREE, size - 1, 0),
+ build_int_cst (NULL_TREE, size - 1),
NULL_RTX, 0);
t3 = force_operand (gen_rtx_MINUS (compute_mode, t1, nsign),
NULL_RTX);
rtx t1, t2, t3;
unsigned HOST_WIDE_INT d = INTVAL (op1);
t1 = expand_shift (RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE,
- floor_log2 (d), 0),
+ build_int_cst (NULL_TREE, floor_log2 (d)),
tquotient, 1);
t2 = expand_binop (compute_mode, and_optab, op0,
GEN_INT (d - 1),
rtx t1, t2, t3;
unsigned HOST_WIDE_INT d = INTVAL (op1);
t1 = expand_shift (RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE,
- floor_log2 (d), 0),
+ build_int_cst (NULL_TREE, floor_log2 (d)),
tquotient, 0);
t2 = expand_binop (compute_mode, and_optab, op0,
GEN_INT (d - 1),
pre_shift = floor_log2 (d & -d);
ml = invert_mod2n (d >> pre_shift, size);
t1 = expand_shift (RSHIFT_EXPR, compute_mode, op0,
- build_int_cst (NULL_TREE, pre_shift, 0),
+ build_int_cst (NULL_TREE, pre_shift),
NULL_RTX, unsignedp);
quotient = expand_mult (compute_mode, t1,
gen_int_mode (ml, compute_mode),
}
tem = plus_constant (op1, -1);
tem = expand_shift (RSHIFT_EXPR, compute_mode, tem,
- build_int_cst (NULL_TREE, 1, 0),
+ build_int_cst (NULL_TREE, 1),
NULL_RTX, 1);
do_cmp_and_jump (remainder, tem, LEU, compute_mode, label);
expand_inc (quotient, const1_rtx);
abs_rem = expand_abs (compute_mode, remainder, NULL_RTX, 1, 0);
abs_op1 = expand_abs (compute_mode, op1, NULL_RTX, 1, 0);
tem = expand_shift (LSHIFT_EXPR, compute_mode, abs_rem,
- build_int_cst (NULL_TREE, 1, 0),
+ build_int_cst (NULL_TREE, 1),
NULL_RTX, 1);
do_cmp_and_jump (tem, abs_op1, LTU, compute_mode, label);
tem = expand_binop (compute_mode, xor_optab, op0, op1,
NULL_RTX, 0, OPTAB_WIDEN);
mask = expand_shift (RSHIFT_EXPR, compute_mode, tem,
- build_int_cst (NULL_TREE, size - 1, 0),
+ build_int_cst (NULL_TREE, size - 1),
NULL_RTX, 0);
tem = expand_binop (compute_mode, xor_optab, mask, const1_rtx,
NULL_RTX, 0, OPTAB_WIDEN);
return gen_lowpart (mode, rem_flag ? remainder : quotient);
default:
- abort ();
+ gcc_unreachable ();
}
if (quotient == 0)
< HOST_BITS_PER_WIDE_INT)))
hi = -1;
- t = build_int_cst (type, INTVAL (x), hi);
+ t = build_int_cst_wide (type, INTVAL (x), hi);
return t;
}
case CONST_DOUBLE:
if (GET_MODE (x) == VOIDmode)
- t = build_int_cst (type, CONST_DOUBLE_LOW (x), CONST_DOUBLE_HIGH (x));
+ t = build_int_cst_wide (type,
+ CONST_DOUBLE_LOW (x), CONST_DOUBLE_HIGH (x));
else
{
REAL_VALUE_TYPE d;
{
/* FIXME:It would be nice if we could step directly from this
type to its sizetype equivalent. */
- mult_type = copy_node (type);
- if (TYPE_CACHED_VALUES_P (mult_type))
- {
- /* Clear any set of cached values it has. */
- TYPE_CACHED_VALUES_P (mult_type) = 0;
- TYPE_CACHED_VALUES (mult_type) = NULL_TREE;
- }
+ mult_type = build_distinct_type_copy (type);
TYPE_IS_SIZETYPE (mult_type) = 1;
}
= compare_from_rtx (op0, op1, code, unsignedp, mode, NULL_RTX);
if (CONSTANT_P (comparison))
{
- if (GET_CODE (comparison) == CONST_INT)
+ switch (GET_CODE (comparison))
{
+ case CONST_INT:
if (comparison == const0_rtx)
return const0_rtx;
- }
+ break;
+
#ifdef FLOAT_STORE_FLAG_VALUE
- else if (GET_CODE (comparison) == CONST_DOUBLE)
- {
+ case CONST_DOUBLE:
if (comparison == CONST0_RTX (GET_MODE (comparison)))
return const0_rtx;
- }
+ break;
#endif
- else
- abort ();
+ default:
+ gcc_unreachable ();
+ }
+
if (normalizep == 1)
return const1_rtx;
if (normalizep == -1)
op0 = expand_shift (RSHIFT_EXPR, compare_mode, op0,
size_int (GET_MODE_BITSIZE (compare_mode) - 1),
subtarget, normalizep == 1);
- else if (STORE_FLAG_VALUE & 1)
+ else
{
+ gcc_assert (STORE_FLAG_VALUE & 1);
+
op0 = expand_and (compare_mode, op0, const1_rtx, subtarget);
if (normalizep == -1)
op0 = expand_unop (compare_mode, neg_optab, op0, op0, 0);
}
- else
- abort ();
/* If we were converting to a smaller mode, do the
conversion now. */
/* do_jump_by_parts_equality_rtx compares with zero. Luckily
that's the only equality operations we do */
case EQ:
- if (arg2 != const0_rtx || mode != GET_MODE(arg1))
- abort ();
+ gcc_assert (arg2 == const0_rtx && mode == GET_MODE(arg1));
do_jump_by_parts_equality_rtx (arg1, label2, label);
break;
case NE:
- if (arg2 != const0_rtx || mode != GET_MODE(arg1))
- abort ();
+ gcc_assert (arg2 == const0_rtx && mode == GET_MODE(arg1));
do_jump_by_parts_equality_rtx (arg1, label, label2);
break;
default:
- abort ();
+ gcc_unreachable ();
}
emit_label (label2);