* optabs.h (OTI_flodiv, flodiv_optab): Kill.

[pf3gnuchains/gcc-fork.git] / gcc / sibcall.c
diff --git a/gcc/sibcall.c b/gcc/sibcall.c

index 120b641..a6638b7 100644 (file)
--- a/gcc/sibcall.c
+++ b/gcc/sibcall.c
@@ -1,5 +1,5 @@
  /* Generic sibling call optimization support
-   Copyright (C) 1999, 2000 Free Software Foundation, Inc.
+   Copyright (C) 1999, 2000, 2001 Free Software Foundation, Inc.
  
  This file is part of GNU CC.
  
@@ -32,14 +32,23 @@ Boston, MA 02111-1307, USA.  */
  #include "output.h"
  #include "except.h"
  
+/* In case alternate_exit_block contains copy from pseudo, to return value,
+   record the pseudo here.  In such case the pseudo must be set to function
+   return in the sibcall sequence.  */
+static rtx return_value_pseudo;
+
  static int identify_call_return_value  PARAMS ((rtx, rtx *, rtx *));
-static rtx skip_copy_to_return_value   PARAMS ((rtx, rtx, rtx));
+static rtx skip_copy_to_return_value   PARAMS ((rtx));
  static rtx skip_use_of_return_value    PARAMS ((rtx, enum rtx_code));
  static rtx skip_stack_adjustment       PARAMS ((rtx));
+static rtx skip_pic_restore            PARAMS ((rtx));
  static rtx skip_jump_insn              PARAMS ((rtx));
-static int uses_addressof              PARAMS ((rtx, int));
+static int call_ends_block_p           PARAMS ((rtx, rtx));
+static int uses_addressof              PARAMS ((rtx));
  static int sequence_uses_addressof     PARAMS ((rtx));
  static void purge_reg_equiv_notes      PARAMS ((void));
+static void purge_mem_unchanging_flag  PARAMS ((rtx));
+static rtx skip_unreturned_value       PARAMS ((rtx));
  
  /* Examine a CALL_PLACEHOLDER pattern and determine where the call's
     return value is located.  P_HARD_RETURN receives the hard register
@@ -82,6 +91,11 @@ identify_call_return_value (cp, p_hard_return, p_soft_return)
    if (! insn)
      return 0;
  
+  /* Restore of GP register may appear here.  */
+  insn = skip_pic_restore (insn);
+  if (! insn)
+    return 0;
+
    /* If there's nothing after, there's no soft return value.  */
    insn = NEXT_INSN (insn);
    if (! insn)
@@ -125,11 +139,15 @@ identify_call_return_value (cp, p_hard_return, p_soft_return)
     copy.  Otherwise return ORIG_INSN.  */
  
  static rtx
-skip_copy_to_return_value (orig_insn, hardret, softret)
+skip_copy_to_return_value (orig_insn)
       rtx orig_insn;
-     rtx hardret, softret;
  {
    rtx insn, set = NULL_RTX;
+  rtx hardret, softret;
+
+  /* If there is no return value, we have nothing to do.  */
+  if (! identify_call_return_value (PATTERN (orig_insn), &hardret, &softret))
+    return orig_insn;
  
    insn = next_nonnote_insn (orig_insn);
    if (! insn)
@@ -139,6 +157,13 @@ skip_copy_to_return_value (orig_insn, hardret, softret)
    if (! set)
      return orig_insn;
  
+  if (return_value_pseudo)
+    {
+      if (SET_DEST (set) == return_value_pseudo)
+        return insn;
+      return orig_insn;
+    }
+
    /* The destination must be the same as the called function's return
       value to ensure that any return value is put in the same place by the
       current function and the function we're calling. 
@@ -157,6 +182,30 @@ skip_copy_to_return_value (orig_insn, hardret, softret)
        && SET_SRC (set) == softret)
      return insn;
  
+  /* Recognize the situation when the called function's return value
+     is copied in two steps: first into an intermediate pseudo, then
+     the into the calling functions return value register.  */
+
+  if (REG_P (SET_DEST (set))
+      && SET_SRC (set) == softret)
+    {
+      rtx x = SET_DEST (set);
+
+      insn = next_nonnote_insn (insn);
+      if (! insn)
+       return orig_insn;
+
+      set = single_set (insn);
+      if (! set)
+       return orig_insn;
+
+      if (SET_DEST (set) == current_function_return_rtx
+         && REG_P (SET_DEST (set))
+         && OUTGOING_REGNO (REGNO (SET_DEST (set))) == REGNO (hardret)
+         && SET_SRC (set) == x)
+       return insn;
+    }
+
    /* It did not look like a copy of the return value, so return the
       same insn we were passed.  */
    return orig_insn;
@@ -184,6 +233,35 @@ skip_use_of_return_value (orig_insn, code)
    return orig_insn;
  }
  
+/* In case function does not return value,  we get clobber of pseudo followed
+   by set to hard return value.  */
+static rtx
+skip_unreturned_value (orig_insn)
+     rtx orig_insn;
+{
+  rtx insn = next_nonnote_insn (orig_insn);
+
+  /* Skip possible clobber of pseudo return register.  */
+  if (insn
+      && GET_CODE (insn) == INSN
+      && GET_CODE (PATTERN (insn)) == CLOBBER
+      && REG_P (XEXP (PATTERN (insn), 0))
+      && (REGNO (XEXP (PATTERN (insn), 0)) >= FIRST_PSEUDO_REGISTER))
+    {
+      rtx set_insn = next_nonnote_insn (insn);
+      rtx set;
+      if (!set_insn)
+       return insn;
+      set = single_set (set_insn);
+      if (!set
+         || SET_SRC (set) != XEXP (PATTERN (insn), 0)
+         || SET_DEST (set) != current_function_return_rtx)
+       return insn;
+      return set_insn;
+    }
+  return orig_insn;
+}
+
  /* If the first real insn after ORIG_INSN adjusts the stack pointer
     by a constant, return the insn with the stack pointer adjustment.
     Otherwise return ORIG_INSN.  */
@@ -199,10 +277,6 @@ skip_stack_adjustment (orig_insn)
    if (insn)
      set = single_set (insn);
  
-  /* The source must be the same as the current function's return value to
-     ensure that any return value is put in the same place by the current
-     function and the function we're calling.   The destination register
-     must be a pseudo.  */
    if (insn
        && set
        && GET_CODE (SET_SRC (set)) == PLUS
@@ -211,8 +285,26 @@ skip_stack_adjustment (orig_insn)
        && SET_DEST (set) == stack_pointer_rtx)
      return insn;
  
-  /* It did not look like a copy of the return value, so return the
-     same insn we were passed.  */
+  return orig_insn;
+}
+
+/* If the first real insn after ORIG_INSN sets the pic register,
+   return it.  Otherwise return ORIG_INSN.  */
+
+static rtx
+skip_pic_restore (orig_insn)
+     rtx orig_insn;
+{
+  rtx insn, set = NULL_RTX;
+
+  insn = next_nonnote_insn (orig_insn);
+
+  if (insn)
+    set = single_set (insn);
+
+  if (insn && set && SET_DEST (set) == pic_offset_table_rtx)
+    return insn;
+
    return orig_insn;
  }
  
@@ -234,19 +326,72 @@ skip_jump_insn (orig_insn)
  
    return orig_insn;
  }
+\f
+/* Using the above functions, see if INSN, skipping any of the above,
+   goes all the way to END, the end of a basic block.  Return 1 if so.  */
+
+static int
+call_ends_block_p (insn, end)
+     rtx insn;
+     rtx end;
+{
+  rtx new_insn;
+  /* END might be a note, so get the last nonnote insn of the block.  */
+  end = next_nonnote_insn (PREV_INSN (end));
+
+  /* If the call was the end of the block, then we're OK.  */
+  if (insn == end)
+    return 1;
+
+  /* Skip over copying from the call's return value pseudo into
+     this function's hard return register and if that's the end
+     of the block, we're OK.  */
+  new_insn = skip_copy_to_return_value (insn);
+
+  /* In case we return value in pseudo, we must set the pseudo to
+     return value of called function, otherwise we are returning
+     something else.  */
+  if (return_value_pseudo && insn == new_insn)
+    return 0;
+  insn = new_insn;
+
+  if (insn == end)
+    return 1;
+
+  /* Skip any stack adjustment.  */
+  insn = skip_stack_adjustment (insn);
+  if (insn == end)
+    return 1;
+
+  /* Skip over a CLOBBER of the return value as a hard reg.  */
+  insn = skip_use_of_return_value (insn, CLOBBER);
+  if (insn == end)
+    return 1;
+
+  /* Skip over a CLOBBER of the return value as a hard reg.  */
+  insn = skip_unreturned_value (insn);
+  if (insn == end)
+    return 1;
+
+  /* Skip over a USE of the return value (as a hard reg).  */
+  insn = skip_use_of_return_value (insn, USE);
+  if (insn == end)
+    return 1;
+
+  /* Skip over a JUMP_INSN at the end of the block.  If that doesn't end the
+     block, the original CALL_INSN didn't.  */
+  insn = skip_jump_insn (insn);
+  return insn == end;
+}
  
  /* Scan the rtx X for ADDRESSOF expressions or
     current_function_internal_arg_pointer registers.
-   INMEM argument should be 1 if we're looking at inner part of some
-   MEM expression, otherwise 0.
-   Return nonzero if an ADDRESSOF expresion is found or if
-   current_function_internal_arg_pointer is found outside of some MEM
-   expression, else return zero.  */
+   Return nonzero if an ADDRESSOF or current_function_internal_arg_pointer
+   is found outside of some MEM expression, else return zero.  */
  
  static int
-uses_addressof (x, inmem)
+uses_addressof (x)
       rtx x;
-     int inmem;
  {
    RTX_CODE code;
    int i, j;
@@ -257,28 +402,25 @@ uses_addressof (x, inmem)
  
    code = GET_CODE (x);
  
-  if (code == ADDRESSOF)
-    return 1;
-
-  if (x == current_function_internal_arg_pointer && ! inmem)
+  if (code == ADDRESSOF || x == current_function_internal_arg_pointer)
      return 1;
  
    if (code == MEM)
-    return uses_addressof (XEXP (x, 0), 1);
+    return 0;
  
-  /* Scan all subexpressions. */
+  /* Scan all subexpressions.  */
    fmt = GET_RTX_FORMAT (code);
    for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
      {
        if (*fmt == 'e')
         {
-         if (uses_addressof (XEXP (x, i), inmem))
+         if (uses_addressof (XEXP (x, i)))
             return 1;
         }
        else if (*fmt == 'E')
         {
           for (j = 0; j < XVECLEN (x, i); j++)
-           if (uses_addressof (XVECEXP (x, i, j), inmem))
+           if (uses_addressof (XVECEXP (x, i, j)))
               return 1;
         }
      }
@@ -301,7 +443,7 @@ sequence_uses_addressof (seq)
    rtx insn;
  
    for (insn = seq; insn; insn = NEXT_INSN (insn))
-    if (GET_RTX_CLASS (GET_CODE (insn)) == 'i')
+    if (INSN_P (insn))
        {
         /* If this is a CALL_PLACEHOLDER, then recursively call ourselves
            with each nonempty sequence attached to the CALL_PLACEHOLDER.  */
@@ -318,8 +460,8 @@ sequence_uses_addressof (seq)
                 && sequence_uses_addressof (XEXP (PATTERN (insn), 2)))
               return 1;
           }
-       else if (uses_addressof (PATTERN (insn), 0)
-                || (REG_NOTES (insn) && uses_addressof (REG_NOTES (insn), 0)))
+       else if (uses_addressof (PATTERN (insn))
+                || (REG_NOTES (insn) && uses_addressof (REG_NOTES (insn))))
           return 1;
        }
    return 0;
@@ -349,6 +491,45 @@ purge_reg_equiv_notes ()
      }
  }
  
+/* Clear RTX_UNCHANGING_P flag of incoming argument MEMs.  */
+
+static void
+purge_mem_unchanging_flag (x)
+     rtx x;
+{
+  RTX_CODE code;
+  int i, j;
+  const char *fmt;
+
+  if (x == NULL_RTX)
+    return;
+
+  code = GET_CODE (x);
+
+  if (code == MEM)
+    {
+      if (RTX_UNCHANGING_P (x)
+         && (XEXP (x, 0) == current_function_internal_arg_pointer
+             || (GET_CODE (XEXP (x, 0)) == PLUS
+                 && XEXP (XEXP (x, 0), 0) ==
+                    current_function_internal_arg_pointer
+                 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)))
+       RTX_UNCHANGING_P (x) = 0;
+      return;
+    }
+
+  /* Scan all subexpressions.  */
+  fmt = GET_RTX_FORMAT (code);
+  for (i = 0; i < GET_RTX_LENGTH (code); i++, fmt++)
+    {
+      if (*fmt == 'e')
+       purge_mem_unchanging_flag (XEXP (x, i));
+      else if (*fmt == 'E')
+       for (j = 0; j < XVECLEN (x, i); j++)
+         purge_mem_unchanging_flag (XVECEXP (x, i, j));
+    }
+}
+
  /* Replace the CALL_PLACEHOLDER with one of its children.  INSN should be
     the CALL_PLACEHOLDER insn; USE tells which child to use.  */
  
@@ -372,7 +553,7 @@ replace_call_placeholder (insn, use)
    if (XEXP (PATTERN (insn), 3))
      LABEL_PRESERVE_P (XEXP (PATTERN (insn), 3)) = 0;
    
-  /* "Delete" the placeholder insn. */
+  /* "Delete" the placeholder insn.  */
    PUT_CODE (insn, NOTE);
    NOTE_SOURCE_FILE (insn) = 0;
    NOTE_LINE_NUMBER (insn) = NOTE_INSN_DELETED;
@@ -405,20 +586,18 @@ optimize_sibling_and_tail_recursive_calls ()
       ahead and find all the EH labels.  */
    find_exception_handler_labels ();
  
-  /* Run a jump optimization pass to clean up the CFG.  We primarily want
-     this to thread jumps so that it is obvious which blocks jump to the
-     epilouge.  */
-  jump_optimize_minimal (insns);
-
+  rebuild_jump_labels (insns);
    /* We need cfg information to determine which blocks are succeeded
       only by the epilogue.  */
    find_basic_blocks (insns, max_reg_num (), 0);
-  cleanup_cfg (insns);
+  cleanup_cfg (CLEANUP_PRE_SIBCALL | CLEANUP_PRE_LOOP);
  
    /* If there are no basic blocks, then there is nothing to do.  */
    if (n_basic_blocks == 0)
      return;
  
+  return_value_pseudo = NULL_RTX;
+
    /* Find the exit block.
  
       It is possible that we have blocks which can reach the exit block
@@ -439,6 +618,7 @@ optimize_sibling_and_tail_recursive_calls ()
            insn;
            insn = NEXT_INSN (insn))
         {
+         rtx set;
           /* This should only happen once, at the start of this block.  */
           if (GET_CODE (insn) == CODE_LABEL)
             continue;
@@ -450,6 +630,18 @@ optimize_sibling_and_tail_recursive_calls ()
               && GET_CODE (PATTERN (insn)) == USE)
             continue;
  
+         /* Exit block also may contain copy from pseudo containing
+            return value to hard register.  */
+         if (GET_CODE (insn) == INSN
+             && (set = single_set (insn))
+             && SET_DEST (set) == current_function_return_rtx
+             && REG_P (SET_SRC (set))
+             && !return_value_pseudo)
+           {
+             return_value_pseudo = SET_SRC (set);
+             continue;
+           }
+
           break;
         }
  
@@ -458,6 +650,8 @@ optimize_sibling_and_tail_recursive_calls ()
          valid alternate exit block.  */
        if (insn == NULL)
         alternate_exit = e->src;
+      else
+       return_value_pseudo = NULL;
      }
  
    /* If the function uses ADDRESSOF, we can't (easily) determine
@@ -480,94 +674,45 @@ optimize_sibling_and_tail_recursive_calls ()
         {
           int sibcall = (XEXP (PATTERN (insn), 1) != NULL_RTX);
           int tailrecursion = (XEXP (PATTERN (insn), 2) != NULL_RTX);
-         basic_block succ_block, call_block;
-         rtx temp, hardret, softret;
-
-         /* We must be careful with stack slots which are live at
-            potential optimization sites.
-
-            ?!? This test is overly conservative and will be replaced.  */
-         if (frame_offset)
-           goto failure;
+         basic_block call_block = BLOCK_FOR_INSN (insn);
  
           /* alloca (until we have stack slot life analysis) inhibits
              sibling call optimizations, but not tail recursion.
-
-            Similarly if we have ADDRESSOF expressions.
-
              Similarly if we use varargs or stdarg since they implicitly
              may take the address of an argument.  */
-         if (current_function_calls_alloca || current_function_uses_addressof
+         if (current_function_calls_alloca
               || current_function_varargs || current_function_stdarg)
             sibcall = 0;
  
-         call_block = BLOCK_FOR_INSN (insn);
-
-         /* If the block has more than one successor, then we can not
-            perform sibcall or tail recursion optimizations.  */
-         if (call_block->succ == NULL
-             || call_block->succ->succ_next != NULL)
-           goto failure;
-
-         /* If the single successor is not the exit block, then we can not
-            perform sibcall or tail recursion optimizations. 
-
-            Note that this test combined with the previous is sufficient
-            to prevent tail call optimization in the presense of active
-            exception handlers.  */
-         succ_block = call_block->succ->dest;
-         if (succ_block != EXIT_BLOCK_PTR && succ_block != alternate_exit)
-           goto failure;
-
-         /* If the call was the end of the block, then we're OK.  */
-         temp = insn;
-         if (temp == call_block->end)
-           goto success;
-
-         /* Skip over copying from the call's return value pseudo into
-            this function's hard return register.  */
-         if (identify_call_return_value (PATTERN (insn), &hardret, &softret))
-           {
-             temp = skip_copy_to_return_value (temp, hardret, softret);
-             if (temp == call_block->end)
-               goto success;
-           }
-
-         /* Skip any stack adjustment.  */
-         temp = skip_stack_adjustment (temp);
-         if (temp == call_block->end)
-           goto success;
-
-         /* Skip over a CLOBBER of the return value (as a hard reg).  */
-         temp = skip_use_of_return_value (temp, CLOBBER);
-         if (temp == call_block->end)
-           goto success;
-
-         /* Skip over a USE of the return value (as a hard reg).  */
-         temp = skip_use_of_return_value (temp, USE);
-         if (temp == call_block->end)
-           goto success;
-
-         /* Skip over the JUMP_INSN at the end of the block.  */
-         temp = skip_jump_insn (temp);
-         if (GET_CODE (temp) == NOTE)
-           temp = next_nonnote_insn (temp);
-         if (temp == call_block->end)
-           goto success;
-
-         /* There are operations at the end of the block which we must
-            execute after returning from the function call.  So this call
-            can not be optimized.  */
-failure:
-         sibcall = 0, tailrecursion = 0;
-success:
+         /* See if there are any reasons we can't perform either sibling or
+            tail call optimizations.  We must be careful with stack slots
+            which are live at potential optimization sites.  ??? The first
+            test is overly conservative and should be replaced.  */
+         if (frame_offset
+             /* Can't take address of local var if used by recursive call.  */
+             || current_function_uses_addressof
+             /* Any function that calls setjmp might have longjmp called from
+                any called function.  ??? We really should represent this
+                properly in the CFG so that this needn't be special cased.  */
+             || current_function_calls_setjmp
+             /* Can't if more than one successor or single successor is not
+                exit block.  These two tests prevent tail call optimization
+                in the presense of active exception handlers.  */
+             || call_block->succ == NULL
+             || call_block->succ->succ_next != NULL
+             || (call_block->succ->dest != EXIT_BLOCK_PTR
+                 && call_block->succ->dest != alternate_exit)
+             /* If this call doesn't end the block, there are operations at
+                the end of the block which we must execute after returning.  */
+             || ! call_ends_block_p (insn, call_block->end))
+           sibcall = 0, tailrecursion = 0;
  
           /* Select a set of insns to implement the call and emit them.
              Tail recursion is the most efficient, so select it over
              a tail/sibling call.  */
-  
           if (sibcall)
             successful_sibling_call = 1;
+
           replaced_call_placeholder = 1;
           replace_call_placeholder (insn, 
                                     tailrecursion != 0 
@@ -578,18 +723,39 @@ success:
         }
      }
  
-  /* A sibling call sequence invalidates any REG_EQUIV notes made for
-     this function's incoming arguments. 
-
-     At the start of RTL generation we know the only REG_EQUIV notes
-     in the rtl chain are those for incoming arguments, so we can safely
-     flush any REG_EQUIV note. 
-
-     This is (slight) overkill.  We could keep track of the highest argument
-     we clobber and be more selective in removing notes, but it does not
-     seem to be worth the effort.  */
    if (successful_sibling_call)
-    purge_reg_equiv_notes ();
+    {
+      rtx insn;
+
+      /* A sibling call sequence invalidates any REG_EQUIV notes made for
+        this function's incoming arguments. 
+
+        At the start of RTL generation we know the only REG_EQUIV notes
+        in the rtl chain are those for incoming arguments, so we can safely
+        flush any REG_EQUIV note. 
+
+        This is (slight) overkill.  We could keep track of the highest
+        argument we clobber and be more selective in removing notes, but it
+        does not seem to be worth the effort.  */
+      purge_reg_equiv_notes ();
+
+      /* A sibling call sequence also may invalidate RTX_UNCHANGING_P
+        flag of some incoming arguments MEM RTLs, because it can write into
+        those slots.  We clear all those bits now.
+        
+        This is (slight) overkill, we could keep track of which arguments
+        we actually write into.  */
+      for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
+       {
+         if (GET_CODE (insn) == NOTE)
+           {
+             if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_FUNCTION_BEG)
+               break;
+           }
+         else if (INSN_P (insn))
+           purge_mem_unchanging_flag (PATTERN (insn));
+       }
+    }
  
    /* There may have been NOTE_INSN_BLOCK_{BEGIN,END} notes in the 
       CALL_PLACEHOLDER alternatives that we didn't emit.  Rebuild the