2007-08-04 Paul Thomas <pault@gcc.gnu.org>

[pf3gnuchains/gcc-fork.git] / gcc / optabs.c
diff --git a/gcc/optabs.c b/gcc/optabs.c

index bc85920..3741139 100644 (file)
--- a/gcc/optabs.c
+++ b/gcc/optabs.c
@@ -1,12 +1,13 @@
  /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
     Copyright (C) 1987, 1988, 1992, 1993, 1994, 1995, 1996, 1997, 1998,
-   1999, 2000, 2001, 2002, 2003, 2004, 2005 Free Software Foundation, Inc.
+   1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007
+   Free Software Foundation, Inc.
  
  This file is part of GCC.
  
  GCC is free software; you can redistribute it and/or modify it under
  the terms of the GNU General Public License as published by the Free
-Software Foundation; either version 2, or (at your option) any later
+Software Foundation; either version 3, or (at your option) any later
  version.
  
  GCC is distributed in the hope that it will be useful, but WITHOUT ANY
@@ -15,9 +16,8 @@ FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  for more details.
  
  You should have received a copy of the GNU General Public License
-along with GCC; see the file COPYING.  If not, write to the Free
-Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
-02110-1301, USA.  */
+along with GCC; see the file COPYING3.  If not see
+<http://www.gnu.org/licenses/>.  */
  
  
  #include "config.h"
@@ -125,10 +125,22 @@ static rtx expand_parity (enum machine_mode, rtx, rtx);
  static enum rtx_code get_rtx_code (enum tree_code, bool);
  static rtx vector_compare_rtx (tree, bool, enum insn_code);
  
+/* Current libcall id.  It doesn't matter what the ids are, as long
+   as each one is unique to the libcall that is emitted.  */
+static HOST_WIDE_INT libcall_id = 0;
+
  #ifndef HAVE_conditional_trap
  #define HAVE_conditional_trap 0
  #define gen_conditional_trap(a,b) (gcc_unreachable (), NULL_RTX)
  #endif
+
+/* Prefixes for the current version of decimal floating point (BID vs. DPD).  */
+#if ENABLE_DECIMAL_BID_FORMAT
+#define DECIMAL_PREFIX "bid_"
+#else
+#define DECIMAL_PREFIX "dpd_"
+#endif
+
  \f
  /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
     the result of operation CODE applied to OP0 (and OP1 if it is a binary
@@ -294,6 +306,12 @@ optab_for_tree_code (enum tree_code code, tree type)
      case REALIGN_LOAD_EXPR:
        return vec_realign_load_optab;
  
+    case WIDEN_SUM_EXPR:
+      return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
+
+    case DOT_PROD_EXPR:
+      return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
+
      case REDUC_MAX_EXPR:
        return TYPE_UNSIGNED (type) ? reduc_umax_optab : reduc_smax_optab;
  
@@ -309,13 +327,51 @@ optab_for_tree_code (enum tree_code code, tree type)
      case VEC_RSHIFT_EXPR:
        return vec_shr_optab;
  
+    case VEC_WIDEN_MULT_HI_EXPR:
+      return TYPE_UNSIGNED (type) ? 
+       vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
+
+    case VEC_WIDEN_MULT_LO_EXPR:
+      return TYPE_UNSIGNED (type) ? 
+       vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
+
+    case VEC_UNPACK_HI_EXPR:
+      return TYPE_UNSIGNED (type) ?
+       vec_unpacku_hi_optab : vec_unpacks_hi_optab;
+
+    case VEC_UNPACK_LO_EXPR:
+      return TYPE_UNSIGNED (type) ? 
+       vec_unpacku_lo_optab : vec_unpacks_lo_optab;
+
+    case VEC_UNPACK_FLOAT_HI_EXPR:
+      /* The signedness is determined from the input operand.  */
+      return TYPE_UNSIGNED (type) ?
+       vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
+
+    case VEC_UNPACK_FLOAT_LO_EXPR:
+      /* The signedness is determined from the input operand.  */
+      return TYPE_UNSIGNED (type) ? 
+       vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
+
+    case VEC_PACK_TRUNC_EXPR:
+      return vec_pack_trunc_optab;
+
+    case VEC_PACK_SAT_EXPR:
+      return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
+
+    case VEC_PACK_FIX_TRUNC_EXPR:
+      /* The signedness is determined from the output operand.  */
+      return TYPE_UNSIGNED (type) ?
+       vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
+
      default:
        break;
      }
  
-  trapv = flag_trapv && INTEGRAL_TYPE_P (type) && !TYPE_UNSIGNED (type);
+  trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
    switch (code)
      {
+    case POINTER_PLUS_EXPR:
      case PLUS_EXPR:
        return trapv ? addv_optab : add_optab;
  
@@ -331,12 +387,172 @@ optab_for_tree_code (enum tree_code code, tree type)
      case ABS_EXPR:
        return trapv ? absv_optab : abs_optab;
  
+    case VEC_EXTRACT_EVEN_EXPR:
+      return vec_extract_even_optab;
+
+    case VEC_EXTRACT_ODD_EXPR:
+      return vec_extract_odd_optab;
+
+    case VEC_INTERLEAVE_HIGH_EXPR:
+      return vec_interleave_high_optab;
+
+    case VEC_INTERLEAVE_LOW_EXPR:
+      return vec_interleave_low_optab;
+
      default:
        return NULL;
      }
  }
  \f
  
+/* Expand vector widening operations.
+
+   There are two different classes of operations handled here:
+   1) Operations whose result is wider than all the arguments to the operation.
+      Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
+      In this case OP0 and optionally OP1 would be initialized,
+      but WIDE_OP wouldn't (not relevant for this case).
+   2) Operations whose result is of the same size as the last argument to the
+      operation, but wider than all the other arguments to the operation.
+      Examples: WIDEN_SUM_EXPR, DOT_PROD_EXPR.
+      In this case WIDE_OP, OP0 and optionally OP1 would be initialized.
+
+   E.g., when called to expand the following operations, this is how
+   the arguments will be initialized:
+                                nops    OP0     OP1     WIDE_OP
+   widening-sum                 2       oprnd0  -       oprnd1          
+   widening-dot-product         3       oprnd0  oprnd1  oprnd2
+   widening-mult                2       oprnd0  oprnd1  -
+   type-promotion (vec-unpack)  1       oprnd0  -       -  */
+
+rtx
+expand_widen_pattern_expr (tree exp, rtx op0, rtx op1, rtx wide_op, rtx target,
+                           int unsignedp)
+{   
+  tree oprnd0, oprnd1, oprnd2;
+  enum machine_mode wmode = 0, tmode0, tmode1 = 0;
+  optab widen_pattern_optab;
+  int icode; 
+  enum machine_mode xmode0, xmode1 = 0, wxmode = 0;
+  rtx temp;
+  rtx pat;
+  rtx xop0, xop1, wxop;
+  int nops = TREE_OPERAND_LENGTH (exp);
+
+  oprnd0 = TREE_OPERAND (exp, 0);
+  tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
+  widen_pattern_optab =
+        optab_for_tree_code (TREE_CODE (exp), TREE_TYPE (oprnd0));
+  icode = (int) widen_pattern_optab->handlers[(int) tmode0].insn_code;
+  gcc_assert (icode != CODE_FOR_nothing);
+  xmode0 = insn_data[icode].operand[1].mode;
+
+  if (nops >= 2)
+    {
+      oprnd1 = TREE_OPERAND (exp, 1);
+      tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
+      xmode1 = insn_data[icode].operand[2].mode;
+    }
+
+  /* The last operand is of a wider mode than the rest of the operands.  */
+  if (nops == 2)
+    {
+      wmode = tmode1;
+      wxmode = xmode1;
+    }
+  else if (nops == 3)
+    {
+      gcc_assert (tmode1 == tmode0);
+      gcc_assert (op1);
+      oprnd2 = TREE_OPERAND (exp, 2);
+      wmode = TYPE_MODE (TREE_TYPE (oprnd2));
+      wxmode = insn_data[icode].operand[3].mode;
+    }
+
+  if (!wide_op)
+    wmode = wxmode = insn_data[icode].operand[0].mode;
+
+  if (!target
+      || ! (*insn_data[icode].operand[0].predicate) (target, wmode))
+    temp = gen_reg_rtx (wmode);
+  else
+    temp = target;
+
+  xop0 = op0;
+  xop1 = op1;
+  wxop = wide_op;
+
+  /* In case the insn wants input operands in modes different from
+     those of the actual operands, convert the operands.  It would
+     seem that we don't need to convert CONST_INTs, but we do, so
+     that they're properly zero-extended, sign-extended or truncated
+     for their mode.  */
+
+  if (GET_MODE (op0) != xmode0 && xmode0 != VOIDmode)
+    xop0 = convert_modes (xmode0,
+                          GET_MODE (op0) != VOIDmode
+                          ? GET_MODE (op0)
+                          : tmode0,
+                          xop0, unsignedp);
+
+  if (op1)
+    if (GET_MODE (op1) != xmode1 && xmode1 != VOIDmode)
+      xop1 = convert_modes (xmode1,
+                            GET_MODE (op1) != VOIDmode
+                            ? GET_MODE (op1)
+                            : tmode1,
+                            xop1, unsignedp);
+
+  if (wide_op)
+    if (GET_MODE (wide_op) != wxmode && wxmode != VOIDmode)
+      wxop = convert_modes (wxmode,
+                            GET_MODE (wide_op) != VOIDmode
+                            ? GET_MODE (wide_op)
+                            : wmode,
+                            wxop, unsignedp);
+
+  /* Now, if insn's predicates don't allow our operands, put them into
+     pseudo regs.  */
+
+  if (! (*insn_data[icode].operand[1].predicate) (xop0, xmode0)
+      && xmode0 != VOIDmode)
+    xop0 = copy_to_mode_reg (xmode0, xop0);
+
+  if (op1)
+    {
+      if (! (*insn_data[icode].operand[2].predicate) (xop1, xmode1)
+          && xmode1 != VOIDmode)
+        xop1 = copy_to_mode_reg (xmode1, xop1);
+
+      if (wide_op)
+        {
+          if (! (*insn_data[icode].operand[3].predicate) (wxop, wxmode)
+              && wxmode != VOIDmode)
+            wxop = copy_to_mode_reg (wxmode, wxop);
+
+          pat = GEN_FCN (icode) (temp, xop0, xop1, wxop);
+        }
+      else
+        pat = GEN_FCN (icode) (temp, xop0, xop1);
+    }
+  else
+    {
+      if (wide_op)
+        {
+          if (! (*insn_data[icode].operand[2].predicate) (wxop, wxmode)
+              && wxmode != VOIDmode)
+            wxop = copy_to_mode_reg (wxmode, wxop);
+
+          pat = GEN_FCN (icode) (temp, xop0, wxop);
+        }
+      else
+        pat = GEN_FCN (icode) (temp, xop0);
+    }
+
+  emit_insn (pat);
+  return temp;
+}
+
  /* Generate code to perform an operation specified by TERNARY_OPTAB
     on operands OP0, OP1 and OP2, with result having machine-mode MODE.
  
@@ -427,9 +643,14 @@ simplify_expand_binop (enum machine_mode mode, optab binoptab,
                        enum optab_methods methods)
  {
    if (CONSTANT_P (op0) && CONSTANT_P (op1))
-    return simplify_gen_binary (binoptab->code, mode, op0, op1);
-  else
-    return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
+    {
+      rtx x = simplify_binary_operation (binoptab->code, mode, op0, op1);
+
+      if (x)
+       return x;
+    }
+
+  return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
  }
  
  /* Like simplify_expand_binop, but always put the result in TARGET.
@@ -482,12 +703,12 @@ expand_vec_shift_expr (tree vec_shift_expr, rtx target)
    mode1 = insn_data[icode].operand[1].mode;
    mode2 = insn_data[icode].operand[2].mode;
  
-  rtx_op1 = expand_expr (vec_oprnd, NULL_RTX, VOIDmode, EXPAND_NORMAL);
+  rtx_op1 = expand_normal (vec_oprnd);
    if (!(*insn_data[icode].operand[1].predicate) (rtx_op1, mode1)
        && mode1 != VOIDmode)
      rtx_op1 = force_reg (mode1, rtx_op1);
  
-  rtx_op2 = expand_expr (shift_oprnd, NULL_RTX, VOIDmode, EXPAND_NORMAL);
+  rtx_op2 = expand_normal (shift_oprnd);
    if (!(*insn_data[icode].operand[2].predicate) (rtx_op2, mode2)
        && mode2 != VOIDmode)
      rtx_op2 = force_reg (mode2, rtx_op2);
@@ -800,8 +1021,10 @@ expand_doubleword_shift (enum machine_mode op1_mode, optab binoptab,
    subword_label = gen_label_rtx ();
    done_label = gen_label_rtx ();
  
+  NO_DEFER_POP;
    do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
                            0, 0, subword_label);
+  OK_DEFER_POP;
  
    if (!expand_superword_shift (binoptab, outof_input, superword_op1,
                                outof_target, into_target,
@@ -998,10 +1221,9 @@ expand_simple_binop (enum machine_mode mode, enum rtx_code code, rtx op0,
    return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
  }
  
-
  /* Return whether OP0 and OP1 should be swapped when expanding a commutative
     binop.  Order them according to commutative_operand_precedence and, if
-   possible, try to put TARGET first.  */
+   possible, try to put TARGET or a pseudo first.  */
  static bool
  swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
  {
@@ -1014,12 +1236,122 @@ swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
    if (op0_prec > op1_prec)
      return false;
  
-  /* With equal precedence, both orders are ok, but try to put the
-     target first.  */
-  return target && rtx_equal_p (op1, target);
+  /* With equal precedence, both orders are ok, but it is better if the
+     first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
+  if (target == 0 || REG_P (target))
+    return (REG_P (op1) && !REG_P (op0)) || target == op1;
+  else
+    return rtx_equal_p (op1, target);
  }
  
  
+/* Helper function for expand_binop: handle the case where there
+   is an insn that directly implements the indicated operation.
+   Returns null if this is not possible.  */
+static rtx
+expand_binop_directly (enum machine_mode mode, optab binoptab,
+                      rtx op0, rtx op1,
+                      rtx target, int unsignedp, enum optab_methods methods,
+                      int commutative_op, rtx last)
+{
+  int icode = (int) binoptab->handlers[(int) mode].insn_code;
+  enum machine_mode mode0 = insn_data[icode].operand[1].mode;
+  enum machine_mode mode1 = insn_data[icode].operand[2].mode;
+  enum machine_mode tmp_mode;
+  rtx pat;
+  rtx xop0 = op0, xop1 = op1;
+  rtx temp;
+  
+  if (target)
+    temp = target;
+  else
+    temp = gen_reg_rtx (mode);
+  
+  /* If it is a commutative operator and the modes would match
+     if we would swap the operands, we can save the conversions.  */
+  if (commutative_op)
+    {
+      if (GET_MODE (op0) != mode0 && GET_MODE (op1) != mode1
+         && GET_MODE (op0) == mode1 && GET_MODE (op1) == mode0)
+       {
+         rtx tmp;
+         
+         tmp = op0; op0 = op1; op1 = tmp;
+         tmp = xop0; xop0 = xop1; xop1 = tmp;
+       }
+    }
+  
+  /* In case the insn wants input operands in modes different from
+     those of the actual operands, convert the operands.  It would
+     seem that we don't need to convert CONST_INTs, but we do, so
+     that they're properly zero-extended, sign-extended or truncated
+     for their mode.  */
+  
+  if (GET_MODE (op0) != mode0 && mode0 != VOIDmode)
+    xop0 = convert_modes (mode0,
+                         GET_MODE (op0) != VOIDmode
+                         ? GET_MODE (op0)
+                         : mode,
+                         xop0, unsignedp);
+  
+  if (GET_MODE (op1) != mode1 && mode1 != VOIDmode)
+    xop1 = convert_modes (mode1,
+                         GET_MODE (op1) != VOIDmode
+                         ? GET_MODE (op1)
+                         : mode,
+                         xop1, unsignedp);
+  
+  /* Now, if insn's predicates don't allow our operands, put them into
+     pseudo regs.  */
+  
+  if (!insn_data[icode].operand[1].predicate (xop0, mode0)
+      && mode0 != VOIDmode)
+    xop0 = copy_to_mode_reg (mode0, xop0);
+  
+  if (!insn_data[icode].operand[2].predicate (xop1, mode1)
+      && mode1 != VOIDmode)
+    xop1 = copy_to_mode_reg (mode1, xop1);
+  
+  if (binoptab == vec_pack_trunc_optab 
+      || binoptab == vec_pack_usat_optab
+      || binoptab == vec_pack_ssat_optab
+      || binoptab == vec_pack_ufix_trunc_optab
+      || binoptab == vec_pack_sfix_trunc_optab)
+    {
+      /* The mode of the result is different than the mode of the
+        arguments.  */
+      tmp_mode = insn_data[icode].operand[0].mode;
+      if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
+       return 0;
+    }
+  else
+    tmp_mode = mode;
+
+  if (!insn_data[icode].operand[0].predicate (temp, tmp_mode))
+    temp = gen_reg_rtx (tmp_mode);
+  
+  pat = GEN_FCN (icode) (temp, xop0, xop1);
+  if (pat)
+    {
+      /* If PAT is composed of more than one insn, try to add an appropriate
+        REG_EQUAL note to it.  If we can't because TEMP conflicts with an
+        operand, call expand_binop again, this time without a target.  */
+      if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
+         && ! add_equal_note (pat, temp, binoptab->code, xop0, xop1))
+       {
+         delete_insns_since (last);
+         return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
+                              unsignedp, methods);
+       }
+      
+      emit_insn (pat);
+      return temp;
+    }
+
+  delete_insns_since (last);
+  return NULL_RTX;
+}
+
  /* Generate code to perform an operation specified by BINOPTAB
     on operands OP0 and OP1, with result having machine-mode MODE.
  
@@ -1049,7 +1381,6 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
                   || binoptab->code == ROTATERT);
    rtx entry_last = get_last_insn ();
    rtx last;
-  bool first_pass_p;
  
    class = GET_MODE_CLASS (mode);
  
@@ -1083,7 +1414,10 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
    /* Record where to delete back to if we backtrack.  */
    last = get_last_insn ();
  
-  /* If operation is commutative, canonicalize the order of the operands.  */
+  /* If operation is commutative,
+     try to make the first operand a register.
+     Even better, try to make it the same as the target.
+     Also try to make the last operand a constant.  */
    if (GET_RTX_CLASS (binoptab->code) == RTX_COMM_ARITH
        || binoptab == smul_widen_optab
        || binoptab == umul_widen_optab
@@ -1091,6 +1425,7 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
        || binoptab == umul_highpart_optab)
      {
        commutative_op = 1;
+
        if (swap_commutative_operands_with_target (target, op0, op1))
         {
           temp = op1;
@@ -1099,113 +1434,50 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
         }
      }
  
- retry:
-
    /* If we can do it with a three-operand insn, do so.  */
  
    if (methods != OPTAB_MUST_WIDEN
        && binoptab->handlers[(int) mode].insn_code != CODE_FOR_nothing)
      {
-      int icode = (int) binoptab->handlers[(int) mode].insn_code;
-      enum machine_mode mode0 = insn_data[icode].operand[1].mode;
-      enum machine_mode mode1 = insn_data[icode].operand[2].mode;
-      rtx pat;
-      rtx xop0 = op0, xop1 = op1;
-
-      if (target)
-       temp = target;
-      else
-       temp = gen_reg_rtx (mode);
-
-      /* If it is a commutative operator and the modes would match
-        if we would swap the operands, we can save the conversions.  */
-      if (commutative_op)
-       {
-         if (GET_MODE (op0) != mode0 && GET_MODE (op1) != mode1
-             && GET_MODE (op0) == mode1 && GET_MODE (op1) == mode0)
-           {
-             rtx tmp;
-
-             tmp = op0; op0 = op1; op1 = tmp;
-             tmp = xop0; xop0 = xop1; xop1 = tmp;
-           }
-       }
-
-      /* In case the insn wants input operands in modes different from
-        those of the actual operands, convert the operands.  It would
-        seem that we don't need to convert CONST_INTs, but we do, so
-        that they're properly zero-extended, sign-extended or truncated
-        for their mode.  */
-
-      if (GET_MODE (op0) != mode0 && mode0 != VOIDmode)
-       xop0 = convert_modes (mode0,
-                             GET_MODE (op0) != VOIDmode
-                             ? GET_MODE (op0)
-                             : mode,
-                             xop0, unsignedp);
-
-      if (GET_MODE (op1) != mode1 && mode1 != VOIDmode)
-       xop1 = convert_modes (mode1,
-                             GET_MODE (op1) != VOIDmode
-                             ? GET_MODE (op1)
-                             : mode,
-                             xop1, unsignedp);
-
-      /* Now, if insn's predicates don't allow our operands, put them into
-        pseudo regs.  */
-
-      if (!insn_data[icode].operand[1].predicate (xop0, mode0)
-         && mode0 != VOIDmode)
-       xop0 = copy_to_mode_reg (mode0, xop0);
-
-      if (!insn_data[icode].operand[2].predicate (xop1, mode1)
-         && mode1 != VOIDmode)
-       xop1 = copy_to_mode_reg (mode1, xop1);
-
-      if (!insn_data[icode].operand[0].predicate (temp, mode))
-       temp = gen_reg_rtx (mode);
-
-      pat = GEN_FCN (icode) (temp, xop0, xop1);
-      if (pat)
-       {
-         /* If PAT is composed of more than one insn, try to add an appropriate
-            REG_EQUAL note to it.  If we can't because TEMP conflicts with an
-            operand, call ourselves again, this time without a target.  */
-         if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
-             && ! add_equal_note (pat, temp, binoptab->code, xop0, xop1))
-           {
-             delete_insns_since (last);
-             return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
-                                  unsignedp, methods);
-           }
-
-         emit_insn (pat);
-         return temp;
-       }
-      else
-       delete_insns_since (last);
+      temp = expand_binop_directly (mode, binoptab, op0, op1, target,
+                                   unsignedp, methods, commutative_op, last);
+      if (temp)
+       return temp;
      }
  
-  /* If we were trying to rotate by a constant value, and that didn't
-     work, try rotating the other direction before falling back to
-     shifts and bitwise-or.  */
-  if (first_pass_p
-      && (binoptab == rotl_optab || binoptab == rotr_optab)
-      && class == MODE_INT
-      && GET_CODE (op1) == CONST_INT
-      && INTVAL (op1) > 0
-      && (unsigned int) INTVAL (op1) < GET_MODE_BITSIZE (mode))
+  /* If we were trying to rotate, and that didn't work, try rotating
+     the other direction before falling back to shifts and bitwise-or.  */
+  if (((binoptab == rotl_optab
+       && rotr_optab->handlers[(int) mode].insn_code != CODE_FOR_nothing)
+       || (binoptab == rotr_optab
+          && rotl_optab->handlers[(int) mode].insn_code != CODE_FOR_nothing))
+      && class == MODE_INT)
      {
-      first_pass_p = false;
-      op1 = GEN_INT (GET_MODE_BITSIZE (mode) - INTVAL (op1));
-      binoptab = binoptab == rotl_optab ? rotr_optab : rotl_optab;
-      goto retry;
+      optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
+      rtx newop1;
+      unsigned int bits = GET_MODE_BITSIZE (mode);
+
+      if (GET_CODE (op1) == CONST_INT)
+       newop1 = GEN_INT (bits - INTVAL (op1));
+      else if (targetm.shift_truncation_mask (mode) == bits - 1)
+       newop1 = negate_rtx (mode, op1);
+      else
+       newop1 = expand_binop (mode, sub_optab,
+                              GEN_INT (bits), op1,
+                              NULL_RTX, unsignedp, OPTAB_DIRECT);
+                                  
+      temp = expand_binop_directly (mode, otheroptab, op0, newop1,
+                                   target, unsignedp, methods,
+                                   commutative_op, last);
+      if (temp)
+       return temp;
      }
  
    /* If this is a multiply, see if we can do a widening operation that
       takes operands of this mode and makes a wider mode.  */
  
-  if (binoptab == smul_optab && GET_MODE_WIDER_MODE (mode) != VOIDmode
+  if (binoptab == smul_optab
+      && GET_MODE_WIDER_MODE (mode) != VOIDmode
        && (((unsignedp ? umul_widen_optab : smul_widen_optab)
            ->handlers[(int) GET_MODE_WIDER_MODE (mode)].insn_code)
           != CODE_FOR_nothing))
@@ -1229,9 +1501,10 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
       can open-code the operation.  Check for a widening multiply at the
       wider mode as well.  */
  
-  if ((class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class)
        && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
-    for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+    for (wider_mode = GET_MODE_WIDER_MODE (mode);
+        wider_mode != VOIDmode;
          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
        {
         if (binoptab->handlers[(int) wider_mode].insn_code != CODE_FOR_nothing
@@ -1391,7 +1664,7 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
           if (expand_doubleword_shift (op1_mode, binoptab,
                                        outof_input, into_input, op1,
                                        outof_target, into_target,
-                                      unsignedp, methods, shift_mask))
+                                      unsignedp, next_methods, shift_mask))
             {
               insns = get_insns ();
               end_sequence ();
@@ -1412,7 +1685,7 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
        && ashl_optab->handlers[(int) word_mode].insn_code != CODE_FOR_nothing
        && lshr_optab->handlers[(int) word_mode].insn_code != CODE_FOR_nothing)
      {
-      rtx insns, equiv_value;
+      rtx insns;
        rtx into_target, outof_target;
        rtx into_input, outof_input;
        rtx inter;
@@ -1512,20 +1785,12 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
  
        if (inter != 0)
         {
-         if (binoptab->code != UNKNOWN)
-           equiv_value = gen_rtx_fmt_ee (binoptab->code, mode, op0, op1);
-         else
-           equiv_value = 0;
-
-         /* We can't make this a no conflict block if this is a word swap,
-            because the word swap case fails if the input and output values
-            are in the same register.  */
-         if (shift_count != BITS_PER_WORD)
-           emit_no_conflict_block (insns, target, op0, op1, equiv_value);
-         else
-           emit_insn (insns);
-
-
+         /* One may be tempted to wrap the insns in a REG_NO_CONFLICT
+            block to help the register allocator a bit.  But a multi-word
+            rotate will need all the input bits when setting the output
+            bits, so there clearly is a conflict between the input and
+            output registers.  So we can't use a no-conflict block here.  */
+         emit_insn (insns);
           return target;
         }
      }
@@ -1714,10 +1979,10 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
  
        if (shift_op)
         {
-         op1_mode = word_mode;
+         op1_mode = targetm.libgcc_shift_count_mode ();
           /* Specify unsigned here,
              since negative shift counts are meaningless.  */
-         op1x = convert_to_mode (word_mode, op1, 1);
+         op1x = convert_to_mode (op1_mode, op1, 1);
         }
  
        if (GET_MODE (op0) != VOIDmode
@@ -1760,9 +2025,10 @@ expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
    /* Look for a wider mode of the same class for which it appears we can do
       the operation.  */
  
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class))
      {
-      for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+      for (wider_mode = GET_MODE_WIDER_MODE (mode);
+          wider_mode != VOIDmode;
            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
         {
           if ((binoptab->handlers[(int) wider_mode].insn_code
@@ -1934,9 +2200,10 @@ expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
  
    /* It can't be done in this mode.  Can we do it in a wider mode?  */
  
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class))
      {
-      for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+      for (wider_mode = GET_MODE_WIDER_MODE (mode);
+          wider_mode != VOIDmode;
            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
         {
           if (unoptab->handlers[(int) wider_mode].insn_code
@@ -2056,9 +2323,10 @@ expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
  
    /* It can't be done in this mode.  Can we do it in a wider mode?  */
  
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class))
      {
-      for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+      for (wider_mode = GET_MODE_WIDER_MODE (mode);
+          wider_mode != VOIDmode;
            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
         {
           if (binoptab->handlers[(int) wider_mode].insn_code
@@ -2155,10 +2423,11 @@ static rtx
  widen_clz (enum machine_mode mode, rtx op0, rtx target)
  {
    enum mode_class class = GET_MODE_CLASS (mode);
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class))
      {
        enum machine_mode wider_mode;
-      for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+      for (wider_mode = GET_MODE_WIDER_MODE (mode);
+          wider_mode != VOIDmode;
            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
         {
           if (clz_optab->handlers[(int) wider_mode].insn_code
@@ -2187,13 +2456,80 @@ widen_clz (enum machine_mode mode, rtx op0, rtx target)
    return 0;
  }
  
+/* Try calculating
+       (bswap:narrow x)
+   as
+       (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
+static rtx
+widen_bswap (enum machine_mode mode, rtx op0, rtx target)
+{
+  enum mode_class class = GET_MODE_CLASS (mode);
+  enum machine_mode wider_mode;
+  rtx x, last;
+
+  if (!CLASS_HAS_WIDER_MODES_P (class))
+    return NULL_RTX;
+
+  for (wider_mode = GET_MODE_WIDER_MODE (mode);
+       wider_mode != VOIDmode;
+       wider_mode = GET_MODE_WIDER_MODE (wider_mode))
+    if (bswap_optab->handlers[wider_mode].insn_code != CODE_FOR_nothing)
+      goto found;
+  return NULL_RTX;
+
+ found:
+  last = get_last_insn ();
+
+  x = widen_operand (op0, wider_mode, mode, true, true);
+  x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
+
+  if (x != 0)
+    x = expand_shift (RSHIFT_EXPR, wider_mode, x,
+                     size_int (GET_MODE_BITSIZE (wider_mode)
+                               - GET_MODE_BITSIZE (mode)),
+                     NULL_RTX, true);
+
+  if (x != 0)
+    {
+      if (target == 0)
+       target = gen_reg_rtx (mode);
+      emit_move_insn (target, gen_lowpart (mode, x));
+    }
+  else
+    delete_insns_since (last);
+
+  return target;
+}
+
+/* Try calculating bswap as two bswaps of two word-sized operands.  */
+
+static rtx
+expand_doubleword_bswap (enum machine_mode mode, rtx op, rtx target)
+{
+  rtx t0, t1;
+
+  t1 = expand_unop (word_mode, bswap_optab,
+                   operand_subword_force (op, 0, mode), NULL_RTX, true);
+  t0 = expand_unop (word_mode, bswap_optab,
+                   operand_subword_force (op, 1, mode), NULL_RTX, true);
+
+  if (target == 0)
+    target = gen_reg_rtx (mode);
+  if (REG_P (target))
+    emit_insn (gen_rtx_CLOBBER (VOIDmode, target));
+  emit_move_insn (operand_subword (target, 0, 1, mode), t0);
+  emit_move_insn (operand_subword (target, 1, 1, mode), t1);
+
+  return target;
+}
+
  /* Try calculating (parity x) as (and (popcount x) 1), where
     popcount can also be done in a wider mode.  */
  static rtx
  expand_parity (enum machine_mode mode, rtx op0, rtx target)
  {
    enum mode_class class = GET_MODE_CLASS (mode);
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class))
      {
        enum machine_mode wider_mode;
        for (wider_mode = mode; wider_mode != VOIDmode;
@@ -2425,8 +2761,27 @@ expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
         goto try_libcall;
      }
  
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
-    for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+  /* Widening (or narrowing) bswap needs special treatment.  */
+  if (unoptab == bswap_optab)
+    {
+      temp = widen_bswap (mode, op0, target);
+      if (temp)
+       return temp;
+
+      if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
+         && unoptab->handlers[word_mode].insn_code != CODE_FOR_nothing)
+       {
+         temp = expand_doubleword_bswap (mode, op0, target);
+         if (temp)
+           return temp;
+       }
+
+      goto try_libcall;
+    }
+
+  if (CLASS_HAS_WIDER_MODES_P (class))
+    for (wider_mode = GET_MODE_WIDER_MODE (mode);
+        wider_mode != VOIDmode;
          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
        {
         if (unoptab->handlers[(int) wider_mode].insn_code != CODE_FOR_nothing)
@@ -2447,7 +2802,9 @@ expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
  
             if (temp)
               {
-               if (class != MODE_INT)
+               if (class != MODE_INT
+                   || !TRULY_NOOP_TRUNCATION (GET_MODE_BITSIZE (mode),
+                                              GET_MODE_BITSIZE (wider_mode)))
                   {
                     if (target == 0)
                       target = gen_reg_rtx (mode);
@@ -2500,7 +2857,7 @@ expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
    if (unoptab->code == NEG)
      {
        /* Try negating floating point values by flipping the sign bit.  */
-      if (class == MODE_FLOAT)
+      if (SCALAR_FLOAT_MODE_P (mode))
         {
           temp = expand_absneg_bit (NEG, mode, op0, target);
           if (temp)
@@ -2555,16 +2912,17 @@ expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
  
        target = gen_reg_rtx (outmode);
        emit_libcall_block (insns, target, value,
-                         gen_rtx_fmt_e (unoptab->code, mode, op0));
+                         gen_rtx_fmt_e (unoptab->code, outmode, op0));
  
        return target;
      }
  
    /* It can't be done in this mode.  Can we do it in a wider mode?  */
  
-  if (class == MODE_INT || class == MODE_FLOAT || class == MODE_COMPLEX_FLOAT)
+  if (CLASS_HAS_WIDER_MODES_P (class))
      {
-      for (wider_mode = GET_MODE_WIDER_MODE (mode); wider_mode != VOIDmode;
+      for (wider_mode = GET_MODE_WIDER_MODE (mode);
+          wider_mode != VOIDmode;
            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
         {
           if ((unoptab->handlers[(int) wider_mode].insn_code
@@ -2652,7 +3010,7 @@ expand_abs_nojump (enum machine_mode mode, rtx op0, rtx target,
      return temp;
  
    /* For floating point modes, try clearing the sign bit.  */
-  if (GET_MODE_CLASS (mode) == MODE_FLOAT)
+  if (SCALAR_FLOAT_MODE_P (mode))
      {
        temp = expand_absneg_bit (ABS, mode, op0, target);
        if (temp)
@@ -2731,15 +3089,8 @@ expand_abs (enum machine_mode mode, rtx op0, rtx target,
    emit_move_insn (target, op0);
    NO_DEFER_POP;
  
-  /* If this mode is an integer too wide to compare properly,
-     compare word by word.  Rely on CSE to optimize constant cases.  */
-  if (GET_MODE_CLASS (mode) == MODE_INT
-      && ! can_compare_p (GE, mode, ccp_jump))
-    do_jump_by_parts_greater_rtx (mode, 0, target, const0_rtx,
-                                 NULL_RTX, op1);
-  else
-    do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
-                            NULL_RTX, NULL_RTX, op1);
+  do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
+                          NULL_RTX, NULL_RTX, op1);
  
    op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
                       target, target, 0);
@@ -2760,63 +3111,79 @@ expand_copysign_absneg (enum machine_mode mode, rtx op0, rtx op1, rtx target,
                         int bitpos, bool op0_is_abs)
  {
    enum machine_mode imode;
-  HOST_WIDE_INT hi, lo;
-  int word;
-  rtx label;
+  int icode;
+  rtx sign, label;
  
    if (target == op1)
      target = NULL_RTX;
  
-  if (!op0_is_abs)
+  /* Check if the back end provides an insn that handles signbit for the
+     argument's mode. */
+  icode = (int) signbit_optab->handlers [(int) mode].insn_code;
+  if (icode != CODE_FOR_nothing)
      {
-      op0 = expand_unop (mode, abs_optab, op0, target, 0);
-      if (op0 == NULL)
-       return NULL_RTX;
-      target = op0;
+      imode = insn_data[icode].operand[0].mode;
+      sign = gen_reg_rtx (imode);
+      emit_unop_insn (icode, sign, op1, UNKNOWN);
      }
    else
      {
-      if (target == NULL_RTX)
-        target = copy_to_reg (op0);
+      HOST_WIDE_INT hi, lo;
+
+      if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
+       {
+         imode = int_mode_for_mode (mode);
+         if (imode == BLKmode)
+           return NULL_RTX;
+         op1 = gen_lowpart (imode, op1);
+       }
        else
-       emit_move_insn (target, op0);
-    }
+       {
+         int word;
  
-  if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
-    {
-      imode = int_mode_for_mode (mode);
-      if (imode == BLKmode)
-       return NULL_RTX;
-      op1 = gen_lowpart (imode, op1);
-    }
-  else
-    {
-      imode = word_mode;
-      if (FLOAT_WORDS_BIG_ENDIAN)
-       word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
+         imode = word_mode;
+         if (FLOAT_WORDS_BIG_ENDIAN)
+           word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
+         else
+           word = bitpos / BITS_PER_WORD;
+         bitpos = bitpos % BITS_PER_WORD;
+         op1 = operand_subword_force (op1, word, mode);
+       }
+
+      if (bitpos < HOST_BITS_PER_WIDE_INT)
+       {
+         hi = 0;
+         lo = (HOST_WIDE_INT) 1 << bitpos;
+       }
        else
-       word = bitpos / BITS_PER_WORD;
-      bitpos = bitpos % BITS_PER_WORD;
-      op1 = operand_subword_force (op1, word, mode);
+       {
+         hi = (HOST_WIDE_INT) 1 << (bitpos - HOST_BITS_PER_WIDE_INT);
+         lo = 0;
+       }
+
+      sign = gen_reg_rtx (imode);
+      sign = expand_binop (imode, and_optab, op1,
+                          immed_double_const (lo, hi, imode),
+                          NULL_RTX, 1, OPTAB_LIB_WIDEN);
      }
  
-  if (bitpos < HOST_BITS_PER_WIDE_INT)
+  if (!op0_is_abs)
      {
-      hi = 0;
-      lo = (HOST_WIDE_INT) 1 << bitpos;
+      op0 = expand_unop (mode, abs_optab, op0, target, 0);
+      if (op0 == NULL)
+       return NULL_RTX;
+      target = op0;
      }
    else
      {
-      hi = (HOST_WIDE_INT) 1 << (bitpos - HOST_BITS_PER_WIDE_INT);
-      lo = 0;
+      if (target == NULL_RTX)
+        target = copy_to_reg (op0);
+      else
+       emit_move_insn (target, op0);
      }
  
-  op1 = expand_binop (imode, and_optab, op1,
-                     immed_double_const (lo, hi, imode),
-                     NULL_RTX, 1, OPTAB_LIB_WIDEN);
-
    label = gen_label_rtx ();
-  emit_cmp_and_jump_insns (op1, const0_rtx, EQ, NULL_RTX, imode, 1, label);
+  emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
  
    if (GET_CODE (op0) == CONST_DOUBLE)
      op0 = simplify_unary_operation (NEG, mode, op0, mode);
@@ -3028,7 +3395,7 @@ struct no_conflict_data
     in the list of insns that constitute the actual no_conflict block /
     libcall block.  */
  static void
-no_conflict_move_test (rtx dest, rtx set, void *p0)
+no_conflict_move_test (rtx dest, const_rtx set, void *p0)
  {
    struct no_conflict_data *p= p0;
  
@@ -3058,6 +3425,44 @@ no_conflict_move_test (rtx dest, rtx set, void *p0)
      p->must_stay = true;
  }
  
+/* Encapsulate the block starting at FIRST and ending with LAST, which is
+   logically equivalent to EQUIV, so it gets manipulated as a unit if it
+   is possible to do so.
+   Nothing is done when flag_non_call_exceptions is set and EQUIV may
+   trap, or when any insn from FIRST through LAST is a control-flow
+   insn.  Otherwise FIRST gets a REG_LIBCALL note pointing at LAST, LAST
+   gets a REG_RETVAL note pointing at FIRST, every insn from FIRST
+   through LAST gets a REG_LIBCALL_ID note carrying the current value
+   of libcall_id, and libcall_id is then incremented.  */
+
+void
+maybe_encapsulate_block (rtx first, rtx last, rtx equiv)
+{
+  if (!flag_non_call_exceptions || !may_trap_p (equiv))
+    {
+      /* We can't attach the REG_LIBCALL and REG_RETVAL notes when the
+        encapsulated region would not be in one basic block, i.e. when
+        there is a control_flow_insn_p insn between FIRST and LAST.  */
+      bool attach_libcall_retval_notes = true;
+      rtx insn, next = NEXT_INSN (last);
+
+      for (insn = first; insn != next; insn = NEXT_INSN (insn))
+       if (control_flow_insn_p (insn))
+         {
+           attach_libcall_retval_notes = false;
+           break;
+         }
+
+      if (attach_libcall_retval_notes)
+       {
+         REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last,
+                                                REG_NOTES (first));
+         REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first,
+                                               REG_NOTES (last));
+         next = NEXT_INSN (last);
+         for (insn = first; insn != next; insn = NEXT_INSN (insn))
+           REG_NOTES (insn) = gen_rtx_EXPR_LIST (REG_LIBCALL_ID,
+                                                 GEN_INT (libcall_id),
+                                                 REG_NOTES (insn));
+         libcall_id++;  /* The next encapsulated block gets a new id.  */
+       }
+    }
+}
+
  /* Emit code to perform a series of operations on a multi-word quantity, one
     word at a time.
  
@@ -3114,6 +3519,8 @@ emit_no_conflict_block (rtx insns, rtx target, rtx op0, rtx op1, rtx equiv)
         remove_note (insn, note);
        if ((note = find_reg_note (insn, REG_RETVAL, NULL)) != NULL)
         remove_note (insn, note);
+      if ((note = find_reg_note (insn, REG_LIBCALL_ID, NULL)) != NULL)
+       remove_note (insn, note);
  
        data.target = target;
        data.first = insns;
@@ -3179,10 +3586,7 @@ emit_no_conflict_block (rtx insns, rtx target, rtx op0, rtx op1, rtx equiv)
    else
      first = NEXT_INSN (prev);
  
-  /* Encapsulate the block so it gets manipulated as a unit.  */
-  REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last,
-                                        REG_NOTES (first));
-  REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first, REG_NOTES (last));
+  maybe_encapsulate_block (first, last, equiv);
  
    return last;
  }
@@ -3211,7 +3615,6 @@ emit_no_conflict_block (rtx insns, rtx target, rtx op0, rtx op1, rtx equiv)
  
     Except for the first group of insns (the ones setting pseudos), the
     block is delimited by REG_RETVAL and REG_LIBCALL notes.  */
-
  void
  emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
  {
@@ -3270,6 +3673,8 @@ emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
         remove_note (insn, note);
        if ((note = find_reg_note (insn, REG_RETVAL, NULL)) != NULL)
         remove_note (insn, note);
+      if ((note = find_reg_note (insn, REG_LIBCALL_ID, NULL)) != NULL)
+       remove_note (insn, note);
  
        next = NEXT_INSN (insn);
  
@@ -3336,30 +3741,7 @@ emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
    else
      first = NEXT_INSN (prev);
  
-  /* Encapsulate the block so it gets manipulated as a unit.  */
-  if (!flag_non_call_exceptions || !may_trap_p (equiv))
-    {
-      /* We can't attach the REG_LIBCALL and REG_RETVAL notes
-        when the encapsulated region would not be in one basic block,
-        i.e. when there is a control_flow_insn_p insn between FIRST and LAST.
-       */
-      bool attach_libcall_retval_notes = true;
-      next = NEXT_INSN (last);
-      for (insn = first; insn != next; insn = NEXT_INSN (insn))
-       if (control_flow_insn_p (insn))
-         {
-           attach_libcall_retval_notes = false;
-           break;
-         }
-
-      if (attach_libcall_retval_notes)
-       {
-         REG_NOTES (first) = gen_rtx_INSN_LIST (REG_LIBCALL, last,
-                                                REG_NOTES (first));
-         REG_NOTES (last) = gen_rtx_INSN_LIST (REG_RETVAL, first,
-                                               REG_NOTES (last));
-       }
-    }
+  maybe_encapsulate_block (first, last, equiv);
  }
  \f
  /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
@@ -3427,9 +3809,6 @@ prepare_cmp_insn (rtx *px, rtx *py, enum rtx_code *pcomparison, rtx size,
    enum machine_mode mode = *pmode;
    rtx x = *px, y = *py;
    int unsignedp = *punsignedp;
-  enum mode_class class;
-
-  class = GET_MODE_CLASS (mode);
  
    /* If we are inside an appropriately-short loop and we are optimizing,
       force expensive constants into a register.  */
@@ -3534,7 +3913,7 @@ prepare_cmp_insn (rtx *px, rtx *py, enum rtx_code *pcomparison, rtx size,
  
    /* Handle a lib call just for the mode we are using.  */
  
-  if (cmp_optab->handlers[(int) mode].libfunc && class != MODE_FLOAT)
+  if (cmp_optab->handlers[(int) mode].libfunc && !SCALAR_FLOAT_MODE_P (mode))
      {
        rtx libfunc = cmp_optab->handlers[(int) mode].libfunc;
        rtx result;
@@ -3545,25 +3924,32 @@ prepare_cmp_insn (rtx *px, rtx *py, enum rtx_code *pcomparison, rtx size,
         libfunc = ucmp_optab->handlers[(int) mode].libfunc;
  
        result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST_MAKE_BLOCK,
-                                       word_mode, 2, x, mode, y, mode);
-
+                                       targetm.libgcc_cmp_return_mode (),
+                                       2, x, mode, y, mode);
+
+      /* There are two kinds of comparison routines. Biased routines
+        return 0/1/2, and unbiased routines return -1/0/1. Other parts
+        of gcc expect that the comparison operation is equivalent
+        to the modified comparison. For signed comparisons compare the 
+        result against 1 in the biased case, and zero in the unbiased
+        case. For unsigned comparisons always compare against 1 after
+        biasing the unbiased result by adding 1. This gives us a way to
+        represent LTU. */
        *px = result;
        *pmode = word_mode;
-      if (TARGET_LIB_INT_CMP_BIASED)
-       /* Integer comparison returns a result that must be compared
-          against 1, so that even if we do an unsigned compare
-          afterward, there is still a value that can represent the
-          result "less than".  */
-       *py = const1_rtx;
-      else
+      *py = const1_rtx;
+
+      if (!TARGET_LIB_INT_CMP_BIASED)
         {
-         *py = const0_rtx;
-         *punsignedp = 1;
+         if (*punsignedp)
+           *px = plus_constant (result, 1);  
+         else
+           *py = const0_rtx;
         }
        return;
      }
  
-  gcc_assert (class == MODE_FLOAT);
+  gcc_assert (SCALAR_FLOAT_MODE_P (mode));
    prepare_float_lib_cmp (px, py, pcomparison, pmode, punsignedp);
  }
  
@@ -3582,7 +3968,7 @@ prepare_operand (int icode, rtx x, int opnum, enum machine_mode mode,
    if (!insn_data[icode].operand[opnum].predicate
        (x, insn_data[icode].operand[opnum].mode))
      {
-      if (no_new_pseudos)
+      if (reload_completed)
         return NULL_RTX;
        x = copy_to_mode_reg (insn_data[icode].operand[opnum].mode, x);
      }
@@ -3647,8 +4033,7 @@ emit_cmp_and_jump_insn_1 (rtx x, rtx y, enum machine_mode mode,
           return;
         }
  
-      if (class != MODE_INT && class != MODE_FLOAT
-         && class != MODE_COMPLEX_FLOAT)
+      if (!CLASS_HAS_WIDER_MODES_P (class))
         break;
  
        wider_mode = GET_MODE_WIDER_MODE (wider_mode);
@@ -3684,9 +4069,11 @@ emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
    /* Swap operands and condition to ensure canonical RTL.  */
    if (swap_commutative_operands_p (x, y))
      {
-      /* If we're not emitting a branch, this means some caller
-         is out of sync.  */
-      gcc_assert (label);
+      /* If we're not emitting a branch, callers are required to pass
+        operands in an order conforming to canonical RTL.  We relax this
+        for commutative comparisons so callers using EQ don't need to do
+        swapping by hand.  */
+      gcc_assert (label || (comparison == swap_condition (comparison)));
  
        op0 = y, op1 = x;
        comparison = swap_condition (comparison);
@@ -3734,7 +4121,9 @@ prepare_float_lib_cmp (rtx *px, rtx *py, enum rtx_code *pcomparison,
    rtx libfunc = 0;
    bool reversed_p = false;
  
-  for (mode = orig_mode; mode != VOIDmode; mode = GET_MODE_WIDER_MODE (mode))
+  for (mode = orig_mode;
+       mode != VOIDmode;
+       mode = GET_MODE_WIDER_MODE (mode))
      {
        if ((libfunc = code_to_optab[comparison]->handlers[mode].libfunc))
         break;
@@ -4321,6 +4710,7 @@ expand_float (rtx to, rtx from, int unsignedp)
    enum insn_code icode;
    rtx target = to;
    enum machine_mode fmode, imode;
+  bool can_do_signed = false;
  
    /* Crash now, because we won't be able to decide which mode to use.  */
    gcc_assert (GET_MODE (from) != VOIDmode);
@@ -4342,8 +4732,14 @@ expand_float (rtx to, rtx from, int unsignedp)
           continue;
  
         icode = can_float_p (fmode, imode, unsignedp);
-       if (icode == CODE_FOR_nothing && imode != GET_MODE (from) && unsignedp)
-         icode = can_float_p (fmode, imode, 0), doing_unsigned = 0;
+       if (icode == CODE_FOR_nothing && unsignedp)
+         {
+           enum insn_code scode = can_float_p (fmode, imode, 0);
+           if (scode != CODE_FOR_nothing)
+             can_do_signed = true;
+           if (imode != GET_MODE (from))
+             icode = scode, doing_unsigned = 0;
+         }
  
         if (icode != CODE_FOR_nothing)
           {
@@ -4362,9 +4758,10 @@ expand_float (rtx to, rtx from, int unsignedp)
           }
        }
  
-  /* Unsigned integer, and no way to convert directly.
-     Convert as signed, then conditionally adjust the result.  */
-  if (unsignedp)
+  /* Unsigned integer, and no way to convert directly.  For binary
+     floating point modes, convert as signed, then conditionally adjust
+     the result.  */
+  if (unsignedp && can_do_signed && !DECIMAL_FLOAT_MODE_P (GET_MODE (to)))
      {
        rtx label = gen_label_rtx ();
        rtx temp;
@@ -4569,7 +4966,7 @@ expand_fix (rtx to, rtx from, int unsignedp)
       This is not needed.  Consider, for instance conversion from SFmode
       into DImode.
  
-     The hot path trought the code is dealing with inputs smaller than 2^63
+     The hot path through the code is dealing with inputs smaller than 2^63
       and doing just the conversion, so there is no bits to lose.
  
       In the other path we know the value is positive in the range 2^63..2^64-1
@@ -4681,6 +5078,46 @@ expand_fix (rtx to, rtx from, int unsignedp)
          convert_move (to, target, 0);
      }
  }
+
+/* Generate code to convert FROM to fixed point and store in TO.  FROM
+   must be floating point, TO must be signed.  Use the conversion optab
+   TAB to do the conversion.
+   Returns true if an insn for some usable pair of modes was found and
+   the conversion was emitted, false if TAB has no handler for any pair
+   tried (in which case nothing is emitted).  */
+
+bool
+expand_sfix_optab (rtx to, rtx from, convert_optab tab)
+{
+  enum insn_code icode;
+  rtx target = to;
+  enum machine_mode fmode, imode;
+
+  /* We first try to find a pair of modes, one real and one integer, at
+     least as wide as FROM and TO, respectively, in which we can open-code
+     this conversion.  The first pair for which TAB has a handler is used:
+     FROM is converted to the real mode if that differs from its own, and
+     when the integer mode differs from that of TO the insn writes a
+     temporary which is then moved into TO with convert_move (last
+     argument 0, presumably meaning a signed conversion).  */
+
+  for (fmode = GET_MODE (from); fmode != VOIDmode;
+       fmode = GET_MODE_WIDER_MODE (fmode))
+    for (imode = GET_MODE (to); imode != VOIDmode;
+        imode = GET_MODE_WIDER_MODE (imode))
+      {
+       icode = tab->handlers[imode][fmode].insn_code;
+       if (icode != CODE_FOR_nothing)
+         {
+           if (fmode != GET_MODE (from))
+             from = convert_to_mode (fmode, from, 0);
+
+           if (imode != GET_MODE (to))
+             target = gen_reg_rtx (imode);
+
+           emit_unop_insn (icode, target, from, UNKNOWN);
+           if (target != to)
+             convert_move (to, target, 0);
+           return true;
+         }
+      }
+
+  return false;  /* No mode pair in TAB can do this conversion.  */
+}
  \f
  /* Report whether we have an instruction to perform the operation
     specified by CODE on operands of mode MODE.  */
@@ -4823,7 +5260,16 @@ init_integral_libfuncs (optab optable, const char *opname, int suffix)
  static void
  init_floating_libfuncs (optab optable, const char *opname, int suffix)
  {
+  char *dec_opname = alloca (sizeof (DECIMAL_PREFIX) + strlen (opname));
+
+  /* For BID support, change the name to have either a bid_ or dpd_ prefix
+     depending on the low level floating format used.  */
+  memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
+  strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
+
    init_libfuncs (optable, MIN_MODE_FLOAT, MAX_MODE_FLOAT, opname, suffix);
+  init_libfuncs (optable, MIN_MODE_DECIMAL_FLOAT, MAX_MODE_DECIMAL_FLOAT,
+                dec_opname, suffix);
  }
  
  /* Initialize the libfunc fields of an entire group of entries of an
@@ -4845,8 +5291,13 @@ init_interclass_conv_libfuncs (convert_optab tab, const char *opname,
    const char *fname, *tname;
    const char *q;
    char *libfunc_name, *suffix;
+  char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
    char *p;
  
+  /* If this is a decimal conversion, add the current BID vs. DPD prefix that
+     depends on which underlying decimal floating point format is used.  */
+  const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
+
    for (fmode = first_from_mode;
         fmode != VOIDmode;
         fmode = GET_MODE_WIDER_MODE (fmode))
@@ -4857,11 +5308,18 @@ init_interclass_conv_libfuncs (convert_optab tab, const char *opname,
         tmode = GET_MODE_WIDER_MODE (tmode))
      max_mname_len = MAX (max_mname_len, strlen (GET_MODE_NAME (tmode)));
  
-  libfunc_name = alloca (2 + opname_len + 2*max_mname_len + 1 + 1);
-  libfunc_name[0] = '_';
-  libfunc_name[1] = '_';
-  memcpy (&libfunc_name[2], opname, opname_len);
-  suffix = libfunc_name + opname_len + 2;
+  nondec_name = alloca (2 + opname_len + 2*max_mname_len + 1 + 1);
+  nondec_name[0] = '_';
+  nondec_name[1] = '_';
+  memcpy (&nondec_name[2], opname, opname_len);
+  nondec_suffix = nondec_name + opname_len + 2;
+
+  dec_name = alloca (2 + dec_len + opname_len + 2*max_mname_len + 1 + 1);
+  dec_name[0] = '_';
+  dec_name[1] = '_';
+  memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
+  memcpy (&dec_name[2+dec_len], opname, opname_len);
+  dec_suffix = dec_name + dec_len + opname_len + 2;
  
    for (fmode = first_from_mode; fmode != VOIDmode;
         fmode = GET_MODE_WIDER_MODE (fmode))
@@ -4871,6 +5329,17 @@ init_interclass_conv_libfuncs (convert_optab tab, const char *opname,
         fname = GET_MODE_NAME (fmode);
         tname = GET_MODE_NAME (tmode);
  
+       if (DECIMAL_FLOAT_MODE_P(fmode) || DECIMAL_FLOAT_MODE_P(tmode))
+         {
+           libfunc_name = dec_name;
+           suffix = dec_suffix;
+         }
+       else
+         {
+           libfunc_name = nondec_name;
+           suffix = nondec_suffix;
+         }
+
         p = suffix;
         for (q = fname; *q; p++, q++)
           *p = TOLOWER (*q);
@@ -4901,18 +5370,30 @@ init_intraclass_conv_libfuncs (convert_optab tab, const char *opname,
    enum machine_mode nmode, wmode;
    const char *nname, *wname;
    const char *q;
+  char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
    char *libfunc_name, *suffix;
    char *p;
  
+  /* If this is a decimal conversion, add the current BID vs. DPD prefix that
+     depends on which underlying decimal floating point format is used.  */
+  const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
+
    for (nmode = first_mode; nmode != VOIDmode;
         nmode = GET_MODE_WIDER_MODE (nmode))
      max_mname_len = MAX (max_mname_len, strlen (GET_MODE_NAME (nmode)));
  
-  libfunc_name = alloca (2 + opname_len + 2*max_mname_len + 1 + 1);
-  libfunc_name[0] = '_';
-  libfunc_name[1] = '_';
-  memcpy (&libfunc_name[2], opname, opname_len);
-  suffix = libfunc_name + opname_len + 2;
+  nondec_name = alloca (2 + opname_len + 2*max_mname_len + 1 + 1);
+  nondec_name[0] = '_';
+  nondec_name[1] = '_';
+  memcpy (&nondec_name[2], opname, opname_len);
+  nondec_suffix = nondec_name + opname_len + 2;
+
+  dec_name = alloca (2 + dec_len + opname_len + 2*max_mname_len + 1 + 1);
+  dec_name[0] = '_';
+  dec_name[1] = '_';
+  memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
+  memcpy (&dec_name[2 + dec_len], opname, opname_len);
+  dec_suffix = dec_name + dec_len + opname_len + 2;
  
    for (nmode = first_mode; nmode != VOIDmode;
         nmode = GET_MODE_WIDER_MODE (nmode))
@@ -4922,6 +5403,17 @@ init_intraclass_conv_libfuncs (convert_optab tab, const char *opname,
         nname = GET_MODE_NAME (nmode);
         wname = GET_MODE_NAME (wmode);
  
+       if (DECIMAL_FLOAT_MODE_P(nmode) || DECIMAL_FLOAT_MODE_P(wmode))
+         {
+           libfunc_name = dec_name;
+           suffix = dec_suffix;
+         }
+       else
+         {
+           libfunc_name = nondec_name;
+           suffix = nondec_suffix;
+         }
+
         p = suffix;
         for (q = widening ? nname : wname; *q; p++, q++)
           *p = TOLOWER (*q);
@@ -4958,7 +5450,7 @@ init_one_libfunc (const char *name)
  
    /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
       are the flags assigned by targetm.encode_section_info.  */
-  SYMBOL_REF_DECL (symbol) = 0;
+  SET_SYMBOL_REF_DECL (symbol, 0);
  
    return symbol;
  }
@@ -4994,6 +5486,7 @@ void
  init_optabs (void)
  {
    unsigned int i;
+  enum machine_mode int_mode;
  
    /* Start by initializing all tables to contain CODE_FOR_nothing.  */
  
@@ -5021,6 +5514,11 @@ init_optabs (void)
    umul_highpart_optab = init_optab (UNKNOWN);
    smul_widen_optab = init_optab (UNKNOWN);
    umul_widen_optab = init_optab (UNKNOWN);
+  usmul_widen_optab = init_optab (UNKNOWN);
+  smadd_widen_optab = init_optab (UNKNOWN);
+  umadd_widen_optab = init_optab (UNKNOWN);
+  smsub_widen_optab = init_optab (UNKNOWN);
+  umsub_widen_optab = init_optab (UNKNOWN);
    sdiv_optab = init_optab (DIV);
    sdivv_optab = init_optabv (DIV);
    sdivmod_optab = init_optab (UNKNOWN);
@@ -5029,7 +5527,7 @@ init_optabs (void)
    smod_optab = init_optab (MOD);
    umod_optab = init_optab (UMOD);
    fmod_optab = init_optab (UNKNOWN);
-  drem_optab = init_optab (UNKNOWN);
+  remainder_optab = init_optab (UNKNOWN);
    ftrunc_optab = init_optab (UNKNOWN);
    and_optab = init_optab (AND);
    ior_optab = init_optab (IOR);
@@ -5052,6 +5550,8 @@ init_optabs (void)
    movstrict_optab = init_optab (STRICT_LOW_PART);
    cmp_optab = init_optab (COMPARE);
  
+  storent_optab = init_optab (UNKNOWN);
+
    ucmp_optab = init_optab (UNKNOWN);
    tst_optab = init_optab (UNKNOWN);
  
@@ -5069,6 +5569,7 @@ init_optabs (void)
    absv_optab = init_optabv (ABS);
    addcc_optab = init_optab (UNKNOWN);
    one_cmpl_optab = init_optab (NOT);
+  bswap_optab = init_optab (BSWAP);
    ffs_optab = init_optab (FFS);
    clz_optab = init_optab (CLZ);
    ctz_optab = init_optab (CTZ);
@@ -5076,14 +5577,11 @@ init_optabs (void)
    parity_optab = init_optab (PARITY);
    sqrt_optab = init_optab (SQRT);
    floor_optab = init_optab (UNKNOWN);
-  lfloor_optab = init_optab (UNKNOWN);
    ceil_optab = init_optab (UNKNOWN);
-  lceil_optab = init_optab (UNKNOWN);
    round_optab = init_optab (UNKNOWN);
    btrunc_optab = init_optab (UNKNOWN);
    nearbyint_optab = init_optab (UNKNOWN);
    rint_optab = init_optab (UNKNOWN);
-  lrint_optab = init_optab (UNKNOWN);
    sincos_optab = init_optab (UNKNOWN);
    sin_optab = init_optab (UNKNOWN);
    asin_optab = init_optab (UNKNOWN);
@@ -5094,6 +5592,7 @@ init_optabs (void)
    exp2_optab = init_optab (UNKNOWN);
    expm1_optab = init_optab (UNKNOWN);
    ldexp_optab = init_optab (UNKNOWN);
+  scalb_optab = init_optab (UNKNOWN);
    logb_optab = init_optab (UNKNOWN);
    ilogb_optab = init_optab (UNKNOWN);
    log_optab = init_optab (UNKNOWN);
@@ -5103,6 +5602,9 @@ init_optabs (void)
    tan_optab = init_optab (UNKNOWN);
    atan_optab = init_optab (UNKNOWN);
    copysign_optab = init_optab (UNKNOWN);
+  signbit_optab = init_optab (UNKNOWN);
+
+  isinf_optab = init_optab (UNKNOWN);
  
    strlen_optab = init_optab (UNKNOWN);
    cbranch_optab = init_optab (UNKNOWN);
@@ -5117,13 +5619,39 @@ init_optabs (void)
    reduc_splus_optab = init_optab (UNKNOWN);
    reduc_uplus_optab = init_optab (UNKNOWN);
  
+  ssum_widen_optab = init_optab (UNKNOWN);
+  usum_widen_optab = init_optab (UNKNOWN);
+  sdot_prod_optab = init_optab (UNKNOWN); 
+  udot_prod_optab = init_optab (UNKNOWN);
+
    vec_extract_optab = init_optab (UNKNOWN);
+  vec_extract_even_optab = init_optab (UNKNOWN);
+  vec_extract_odd_optab = init_optab (UNKNOWN);
+  vec_interleave_high_optab = init_optab (UNKNOWN);
+  vec_interleave_low_optab = init_optab (UNKNOWN);
    vec_set_optab = init_optab (UNKNOWN);
    vec_init_optab = init_optab (UNKNOWN);
    vec_shl_optab = init_optab (UNKNOWN);
    vec_shr_optab = init_optab (UNKNOWN);
    vec_realign_load_optab = init_optab (UNKNOWN);
    movmisalign_optab = init_optab (UNKNOWN);
+  vec_widen_umult_hi_optab = init_optab (UNKNOWN);
+  vec_widen_umult_lo_optab = init_optab (UNKNOWN);
+  vec_widen_smult_hi_optab = init_optab (UNKNOWN);
+  vec_widen_smult_lo_optab = init_optab (UNKNOWN);
+  vec_unpacks_hi_optab = init_optab (UNKNOWN);
+  vec_unpacks_lo_optab = init_optab (UNKNOWN);
+  vec_unpacku_hi_optab = init_optab (UNKNOWN);
+  vec_unpacku_lo_optab = init_optab (UNKNOWN);
+  vec_unpacks_float_hi_optab = init_optab (UNKNOWN);
+  vec_unpacks_float_lo_optab = init_optab (UNKNOWN);
+  vec_unpacku_float_hi_optab = init_optab (UNKNOWN);
+  vec_unpacku_float_lo_optab = init_optab (UNKNOWN);
+  vec_pack_trunc_optab = init_optab (UNKNOWN);
+  vec_pack_usat_optab = init_optab (UNKNOWN);
+  vec_pack_ssat_optab = init_optab (UNKNOWN);
+  vec_pack_ufix_trunc_optab = init_optab (UNKNOWN);
+  vec_pack_sfix_trunc_optab = init_optab (UNKNOWN);
  
    powi_optab = init_optab (UNKNOWN);
  
@@ -5137,6 +5665,10 @@ init_optabs (void)
    ufixtrunc_optab = init_convert_optab (UNKNOWN);
    sfloat_optab = init_convert_optab (FLOAT);
    ufloat_optab = init_convert_optab (UNSIGNED_FLOAT);
+  lrint_optab = init_convert_optab (UNKNOWN);
+  lround_optab = init_convert_optab (UNKNOWN);
+  lfloor_optab = init_convert_optab (UNKNOWN);
+  lceil_optab = init_convert_optab (UNKNOWN);
  
    for (i = 0; i < NUM_MACHINE_MODES; i++)
      {
@@ -5169,14 +5701,17 @@ init_optabs (void)
        sync_lock_test_and_set[i] = CODE_FOR_nothing;
        sync_lock_release[i] = CODE_FOR_nothing;
  
-#ifdef HAVE_SECONDARY_RELOADS
        reload_in_optab[i] = reload_out_optab[i] = CODE_FOR_nothing;
-#endif
      }
  
    /* Fill in the optabs with the insns we support.  */
    init_all_optabs ();
  
+  /* The ffs function operates on `int'.  Fall back on it if we do not
+     have a libgcc2 function for that width.  */
+  int_mode = mode_for_size (INT_TYPE_SIZE, MODE_INT, 0);
+  ffs_optab->handlers[(int) int_mode].libfunc = init_one_libfunc ("ffs");
+
    /* Initialize the optabs with the names of the library functions.  */
    init_integral_libfuncs (add_optab, "add", '3');
    init_floating_libfuncs (add_optab, "add", '3');
@@ -5242,14 +5777,45 @@ init_optabs (void)
    /* Conversions.  */
    init_interclass_conv_libfuncs (sfloat_optab, "float",
                                  MODE_INT, MODE_FLOAT);
+  init_interclass_conv_libfuncs (sfloat_optab, "float",
+                                MODE_INT, MODE_DECIMAL_FLOAT);
+  init_interclass_conv_libfuncs (ufloat_optab, "floatun",
+                                MODE_INT, MODE_FLOAT);
+  init_interclass_conv_libfuncs (ufloat_optab, "floatun",
+                                MODE_INT, MODE_DECIMAL_FLOAT);
    init_interclass_conv_libfuncs (sfix_optab, "fix",
                                  MODE_FLOAT, MODE_INT);
+  init_interclass_conv_libfuncs (sfix_optab, "fix",
+                                MODE_DECIMAL_FLOAT, MODE_INT);
    init_interclass_conv_libfuncs (ufix_optab, "fixuns",
                                  MODE_FLOAT, MODE_INT);
+  init_interclass_conv_libfuncs (ufix_optab, "fixuns",
+                                MODE_DECIMAL_FLOAT, MODE_INT);
+  init_interclass_conv_libfuncs (ufloat_optab, "floatuns",
+                                MODE_INT, MODE_DECIMAL_FLOAT);
+  init_interclass_conv_libfuncs (lrint_optab, "lrint",
+                                MODE_INT, MODE_FLOAT);
+  init_interclass_conv_libfuncs (lround_optab, "lround",
+                                MODE_INT, MODE_FLOAT);
+  init_interclass_conv_libfuncs (lfloor_optab, "lfloor",
+                                MODE_INT, MODE_FLOAT);
+  init_interclass_conv_libfuncs (lceil_optab, "lceil",
+                                MODE_INT, MODE_FLOAT);
  
    /* sext_optab is also used for FLOAT_EXTEND.  */
    init_intraclass_conv_libfuncs (sext_optab, "extend", MODE_FLOAT, true);
+  init_intraclass_conv_libfuncs (sext_optab, "extend", MODE_DECIMAL_FLOAT, true);
+  init_interclass_conv_libfuncs (sext_optab, "extend", MODE_FLOAT, MODE_DECIMAL_FLOAT);
+  init_interclass_conv_libfuncs (sext_optab, "extend", MODE_DECIMAL_FLOAT, MODE_FLOAT);
    init_intraclass_conv_libfuncs (trunc_optab, "trunc", MODE_FLOAT, false);
+  init_intraclass_conv_libfuncs (trunc_optab, "trunc", MODE_DECIMAL_FLOAT, false);
+  init_interclass_conv_libfuncs (trunc_optab, "trunc", MODE_FLOAT, MODE_DECIMAL_FLOAT);
+  init_interclass_conv_libfuncs (trunc_optab, "trunc", MODE_DECIMAL_FLOAT, MODE_FLOAT);
+
+  /* Explicitly initialize the bswap libfuncs since we need them to be
+     valid for things other than word_mode.  */
+  set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
+  set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
  
    /* Use cabs for double complex abs, since systems generally have cabs.
       Don't define any libcall for float complex, so that cabs will be used.  */
@@ -5257,10 +5823,6 @@ init_optabs (void)
      abs_optab->handlers[TYPE_MODE (complex_double_type_node)].libfunc
        = init_one_libfunc ("cabs");
  
-  /* The ffs function operates on `int'.  */
-  ffs_optab->handlers[(int) mode_for_size (INT_TYPE_SIZE, MODE_INT, 0)].libfunc
-    = init_one_libfunc ("ffs");
-
    abort_libfunc = init_one_libfunc ("abort");
    memcpy_libfunc = init_one_libfunc ("memcpy");
    memmove_libfunc = init_one_libfunc ("memmove");
@@ -5317,7 +5879,7 @@ debug_optab_libfuncs (void)
         h = &o->handlers[j];
         if (h->libfunc)
           {
-           gcc_assert (GET_CODE (h->libfunc) = SYMBOL_REF);
+           gcc_assert (GET_CODE (h->libfunc) == SYMBOL_REF);
             fprintf (stderr, "%s\t%s:\t%s\n",
                      GET_RTX_NAME (o->code),
                      GET_MODE_NAME (j),
@@ -5337,7 +5899,7 @@ debug_optab_libfuncs (void)
           h = &o->handlers[j][k];
           if (h->libfunc)
             {
-             gcc_assert (GET_CODE (h->libfunc) = SYMBOL_REF);
+             gcc_assert (GET_CODE (h->libfunc) == SYMBOL_REF);
               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
                        GET_RTX_NAME (o->code),
                        GET_MODE_NAME (j),
@@ -5472,8 +6034,10 @@ vector_compare_rtx (tree cond, bool unsignedp, enum insn_code icode)
    t_op1 = TREE_OPERAND (cond, 1);
  
    /* Expand operands.  */
-  rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)), 1);
-  rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)), 1);
+  rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
+                        EXPAND_STACK_PARM);
+  rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
+                        EXPAND_STACK_PARM);
  
    if (!insn_data[icode].operand[4].predicate (rtx_op0, GET_MODE (rtx_op0))
        && GET_MODE (rtx_op0) != VOIDmode)
@@ -5534,14 +6098,12 @@ expand_vec_cond_expr (tree vec_cond_expr, rtx target)
    cc_op0 = XEXP (comparison, 0);
    cc_op1 = XEXP (comparison, 1);
    /* Expand both operands and force them in reg, if required.  */
-  rtx_op1 = expand_expr (TREE_OPERAND (vec_cond_expr, 1),
-                        NULL_RTX, VOIDmode, 1);
+  rtx_op1 = expand_normal (TREE_OPERAND (vec_cond_expr, 1));
    if (!insn_data[icode].operand[1].predicate (rtx_op1, mode)
        && mode != VOIDmode)
      rtx_op1 = force_reg (mode, rtx_op1);
  
-  rtx_op2 = expand_expr (TREE_OPERAND (vec_cond_expr, 2),
-                        NULL_RTX, VOIDmode, 1);
+  rtx_op2 = expand_normal (TREE_OPERAND (vec_cond_expr, 2));
    if (!insn_data[icode].operand[2].predicate (rtx_op2, mode)
        && mode != VOIDmode)
      rtx_op2 = force_reg (mode, rtx_op2);