#include "flags.h"
#include "cgraph.h"
#include "diagnostic.h"
+#include "gimple-pretty-print.h"
#include "timevar.h"
#include "params.h"
#include "fibheap.h"
/* Estimate the size of the function after inlining WHAT into TO. */
-static int
+static inline int
cgraph_estimate_size_after_inlining (int times, struct cgraph_node *to,
struct cgraph_node *what)
{
- int size = (what->global.size - inline_summary (what)->size_inlining_benefit) * times + to->global.size;
+ int size = ((what->global.size - inline_summary (what)->size_inlining_benefit)
+ * times + to->global.size);
gcc_assert (size >= 0);
return size;
}
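
/* Illustrative example (assumed numbers, not part of the patch): if WHAT
   has size 40 with a size_inlining_benefit of 10, inlining it at two call
   sites (times == 2) into a TO of size 100 yields
   (40 - 10) * 2 + 100 == 160 size units. */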
else
{
struct cgraph_node *n;
- n = cgraph_clone_node (e->callee, e->count, e->frequency, e->loop_nest,
+ n = cgraph_clone_node (e->callee, e->callee->decl,
+ e->count, e->frequency, e->loop_nest,
update_original, NULL);
cgraph_redirect_edge_callee (e, n);
}
gcc_assert (e->inline_failed);
e->inline_failed = CIF_OK;
-
- if (!e->callee->global.inlined)
- DECL_POSSIBLY_INLINED (e->callee->decl) = true;
- e->callee->global.inlined = true;
+ DECL_POSSIBLY_INLINED (e->callee->decl) = true;
cgraph_clone_inlined_nodes (e, true, update_original);
overall_size += new_size - old_size;
ncalls_inlined++;
- if (flag_indirect_inlining)
+ /* FIXME: We should remove the optimize check after we ensure we never run
+ IPA passes when not optimizing. */
+ if (flag_indirect_inlining && optimize)
return ipa_propagate_indirect_call_infos (curr, new_edges);
else
return false;
we decide not to inline for different reasons, but it is not a big deal
as in that case we will keep the body around, but we will also avoid
some inlining. */
- if (cgraph_only_called_directly_p (node)
+ if (cgraph_will_be_removed_from_program_if_no_direct_calls (node)
&& !DECL_EXTERNAL (node->decl) && !self_recursive)
growth -= node->global.size;
We call recursive inlining all cases where the same function appears
more than once in a single recursion nest path in the inline graph. */
-static bool
+static inline bool
cgraph_recursive_inlining_p (struct cgraph_node *to,
struct cgraph_node *what,
cgraph_inline_failed_t *reason)
(cgraph_estimate_size_after_inlining (1, edge->caller, edge->callee)
- edge->caller->global.size);
+ if (edge->callee->local.disregard_inline_limits)
+ return INT_MIN;
+
if (dump)
{
fprintf (dump_file, "    Badness calculation for %s -> %s\n",
return badness;
}
+/* Recompute badness of EDGE and update its key in HEAP if needed. */
+static void
+update_edge_key (fibheap_t heap, struct cgraph_edge *edge)
+{
+ int badness = cgraph_edge_badness (edge, false);
+ if (edge->aux)
+ {
+ fibnode_t n = (fibnode_t) edge->aux;
+ gcc_checking_assert (n->data == edge);
+
+ /* fibheap_replace_key can only decrease keys.
+ When we increase the key, we do not update the heap
+ and instead re-insert the element once it becomes
+ the minimum of the heap. */
+ if (badness < n->key)
+ {
+ fibheap_replace_key (heap, n, badness);
+ gcc_checking_assert (n->key == badness);
+ }
+ }
+ else
+ edge->aux = fibheap_insert (heap, badness, edge);
+}
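+
+/* Usage sketch (illustrative, not part of the patch): the main inlining
+   loop pairs this decrease-only discipline with a lazy re-check when it
+   pops the heap minimum, keeping fibheap_replace_key on its cheap
+   decrease-key path:
+
+     badness = fibheap_min_key (heap);
+     edge = (struct cgraph_edge *) fibheap_extract_min (heap);
+     current_badness = cgraph_edge_badness (edge, false);
+     if (current_badness != badness)
+       edge->aux = fibheap_insert (heap, current_badness, edge);
+*/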
+
/* Recompute heap nodes for each caller edge. */
static void
struct cgraph_edge *edge;
cgraph_inline_failed_t failed_reason;
- if (!node->local.inlinable || node->local.disregard_inline_limits
+ if (!node->local.inlinable
|| node->global.inlined_to)
return;
if (bitmap_bit_p (updated_nodes, node->uid))
bitmap_set_bit (updated_nodes, node->uid);
node->global.estimated_growth = INT_MIN;
- if (!node->local.inlinable)
+ /* See if there is something to do. */
+ for (edge = node->callers; edge; edge = edge->next_caller)
+ if (edge->inline_failed)
+ break;
+ if (!edge)
return;
/* Prune out edges we won't inline into anymore. */
if (!cgraph_default_inline_p (node, &failed_reason))
{
- for (edge = node->callers; edge; edge = edge->next_caller)
+ for (; edge; edge = edge->next_caller)
if (edge->aux)
{
fibheap_delete_node (heap, (fibnode_t) edge->aux);
return;
}
- for (edge = node->callers; edge; edge = edge->next_caller)
+ for (; edge; edge = edge->next_caller)
if (edge->inline_failed)
+ update_edge_key (heap, edge);
+}
+
+/* Recompute heap nodes for each uninlined call.
+ This is used when we know that edge badnesses can only increase
+ (we introduced a new call site), so all we need to do is insert the
+ newly created edges into the heap. */
+
+static void
+update_callee_keys (fibheap_t heap, struct cgraph_node *node,
+ bitmap updated_nodes)
+{
+ struct cgraph_edge *e = node->callees;
+ node->global.estimated_growth = INT_MIN;
+
+ if (!e)
+ return;
+ while (true)
+ if (!e->inline_failed && e->callee->callees)
+ e = e->callee->callees;
+ else
{
- int badness = cgraph_edge_badness (edge, false);
- if (edge->aux)
+ if (e->inline_failed
+ && e->callee->local.inlinable
+ && !bitmap_bit_p (updated_nodes, e->callee->uid))
{
- fibnode_t n = (fibnode_t) edge->aux;
- gcc_assert (n->data == edge);
- if (n->key == badness)
- continue;
-
- /* fibheap_replace_key only increase the keys. */
- if (badness < n->key)
+ node->global.estimated_growth = INT_MIN;
+ /* If the function becomes uninlinable, we need to remove it
+ from the heap. */
+ if (!cgraph_default_inline_p (e->callee, &e->inline_failed))
+ update_caller_keys (heap, e->callee, updated_nodes);
+ else
+ /* Otherwise update just edge E. */
+ update_edge_key (heap, e);
+ }
+ if (e->next_callee)
+ e = e->next_callee;
+ else
+ {
+ do
{
- fibheap_replace_key (heap, n, badness);
- gcc_assert (n->key == badness);
- continue;
+ if (e->caller == node)
+ return;
+ e = e->caller->callers;
}
- fibheap_delete_node (heap, (fibnode_t) edge->aux);
+ while (!e->next_callee);
+ e = e->next_callee;
}
- edge->aux = fibheap_insert (heap, badness, edge);
}
}
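
/* Illustrative recursive equivalent of the walk above (the "visit" helper
   is hypothetical, not part of the patch): descend through inlined edges
   and act on the uninlined ones. The iterative form avoids deep recursion
   on large inline trees.

     static void
     walk (struct cgraph_node *n)
     {
       struct cgraph_edge *e;
       for (e = n->callees; e; e = e->next_callee)
	 if (!e->inline_failed)
	   walk (e->callee);
	 else
	   visit (e);
     }
*/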
-/* Recompute heap nodes for each of caller edges of each of callees. */
+/* Recompute heap nodes for the caller edges of each callee.
+ Walk recursively into all inline clones. */
static void
-update_callee_keys (fibheap_t heap, struct cgraph_node *node,
- bitmap updated_nodes)
+update_all_callee_keys (fibheap_t heap, struct cgraph_node *node,
+ bitmap updated_nodes)
{
- struct cgraph_edge *e;
+ struct cgraph_edge *e = node->callees;
node->global.estimated_growth = INT_MIN;
- for (e = node->callees; e; e = e->next_callee)
- if (e->inline_failed)
- update_caller_keys (heap, e->callee, updated_nodes);
- else if (!e->inline_failed)
- update_callee_keys (heap, e->callee, updated_nodes);
+ if (!e)
+ return;
+ while (true)
+ if (!e->inline_failed && e->callee->callees)
+ e = e->callee->callees;
+ else
+ {
+ if (e->inline_failed)
+ update_caller_keys (heap, e->callee, updated_nodes);
+ if (e->next_callee)
+ e = e->next_callee;
+ else
+ {
+ do
+ {
+ if (e->caller == node)
+ return;
+ e = e->caller->callers;
+ }
+ while (!e->next_callee);
+ e = e->next_callee;
+ }
+ }
}
/* Enqueue all recursive calls from NODE into the priority queue depending on
cgraph_node_name (node));
/* We need original clone to copy around. */
- master_clone = cgraph_clone_node (node, node->count, CGRAPH_FREQ_BASE, 1,
+ master_clone = cgraph_clone_node (node, node->decl,
+ node->count, CGRAPH_FREQ_BASE, 1,
false, NULL);
master_clone->needed = true;
for (e = master_clone->callees; e; e = e->next_callee)
struct cgraph_edge *edge = VEC_pop (cgraph_edge_p, new_edges);
gcc_assert (!edge->aux);
- edge->aux = fibheap_insert (heap, cgraph_edge_badness (edge, false), edge);
+ if (edge->callee->local.inlinable
+ && cgraph_default_inline_p (edge->callee, &edge->inline_failed))
+ edge->aux = fibheap_insert (heap, cgraph_edge_badness (edge, false), edge);
}
}
int old_size = overall_size;
struct cgraph_node *where, *callee;
int badness = fibheap_min_key (heap);
+ int current_badness;
int growth;
cgraph_inline_failed_t not_good = CIF_OK;
edge->aux = NULL;
if (!edge->inline_failed)
continue;
-#ifdef ENABLE_CHECKING
- gcc_assert (cgraph_edge_badness (edge, false) == badness);
-#endif
+
+ /* When updating the edge costs, we only decrease badness in the keys.
+ When the badness increases, we keep the heap as it is and re-insert
+ the key now. */
+ current_badness = cgraph_edge_badness (edge, false);
+ gcc_assert (current_badness >= badness);
+ if (current_badness != badness)
+ {
+ edge->aux = fibheap_insert (heap, current_badness, edge);
+ continue;
+ }
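+
+ /* Worked example (assumed numbers, not part of the patch): if EDGE
+ entered the heap with badness 10 and later updates raised its real
+ badness to 25, the heap still reports 10; we re-queue it at 25 and a
+ later iteration pops it once it is the true minimum. */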
+
callee = edge->callee;
growth = (cgraph_estimate_size_after_inlining (1, edge->caller, edge->callee)
}
}
- if (!cgraph_maybe_hot_edge_p (edge))
+ if (edge->callee->local.disregard_inline_limits)
+ ;
+ else if (!cgraph_maybe_hot_edge_p (edge))
not_good = CIF_UNLIKELY_CALL;
- if (!flag_inline_functions
+ else if (!flag_inline_functions
&& !DECL_DECLARED_INLINE_P (edge->callee->decl))
not_good = CIF_NOT_DECLARED_INLINED;
- if (optimize_function_for_size_p (DECL_STRUCT_FUNCTION(edge->caller->decl)))
+ else if (optimize_function_for_size_p (DECL_STRUCT_FUNCTION (edge->caller->decl)))
not_good = CIF_OPTIMIZING_FOR_SIZE;
if (not_good && growth > 0 && cgraph_estimate_growth (edge->callee) > 0)
{
continue;
if (flag_indirect_inlining)
add_new_edges_to_heap (heap, new_indirect_edges);
- update_callee_keys (heap, where, updated_nodes);
+ update_all_callee_keys (heap, where, updated_nodes);
}
else
{
continue;
}
callee = edge->callee;
+ gcc_checking_assert (!callee->global.inlined_to);
cgraph_mark_inline_edge (edge, true, &new_indirect_edges);
if (flag_indirect_inlining)
add_new_edges_to_heap (heap, new_indirect_edges);
- update_callee_keys (heap, callee, updated_nodes);
+ /* We inlined the last offline copy into the body. This might leave
+ the callees of the function with fewer call sites, so they may
+ need updating. */
+ if (callee->global.inlined_to)
+ update_all_callee_keys (heap, callee, updated_nodes);
+ else
+ update_callee_keys (heap, edge->callee, updated_nodes);
}
where = edge->caller;
if (where->global.inlined_to)
if (!edge->inline_failed)
continue;
#ifdef ENABLE_CHECKING
- gcc_assert (cgraph_edge_badness (edge, false) == badness);
+ gcc_assert (cgraph_edge_badness (edge, false) >= badness);
#endif
if (dump_file)
{
if (node->callers
&& !node->callers->next_caller
- && cgraph_only_called_directly_p (node)
+ && cgraph_will_be_removed_from_program_if_no_direct_calls (node)
&& node->local.inlinable
&& node->callers->inline_failed
&& node->callers->caller != node
&& node->callers->caller->global.inlined_to != node
&& !node->callers->call_stmt_cannot_inline_p
- && !DECL_EXTERNAL (node->decl)
- && !DECL_COMDAT (node->decl))
+ && !DECL_EXTERNAL (node->decl))
{
cgraph_inline_failed_t reason;
old_size = overall_size;
unsigned int todo = 0;
int iterations = 0;
- if (sorrycount || errorcount)
+ if (seen_error ())
return 0;
if (!optimize
bool rhs_free = false;
bool lhs_free = false;
- while (handled_component_p (inner_lhs) || TREE_CODE (inner_lhs) == INDIRECT_REF)
+ while (handled_component_p (inner_lhs)
+ || TREE_CODE (inner_lhs) == MEM_REF)
inner_lhs = TREE_OPERAND (inner_lhs, 0);
while (handled_component_p (inner_rhs)
- || TREE_CODE (inner_rhs) == ADDR_EXPR || TREE_CODE (inner_rhs) == INDIRECT_REF)
+ || TREE_CODE (inner_rhs) == ADDR_EXPR
+ || TREE_CODE (inner_rhs) == MEM_REF)
inner_rhs = TREE_OPERAND (inner_rhs, 0);
|| (TREE_CODE (inner_lhs) == SSA_NAME
&& TREE_CODE (SSA_NAME_VAR (inner_lhs)) == RESULT_DECL))
lhs_free = true;
- if (lhs_free && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
+ if (lhs_free
+ && (is_gimple_reg (rhs) || is_gimple_min_invariant (rhs)))
rhs_free = true;
if (lhs_free && rhs_free)
return true;
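
/* Illustrative example (assumed statement, not part of the patch): in
   "retval_5 = x_1", where retval_5 is an SSA name of the RESULT_DECL,
   the LHS test sets lhs_free, and the register RHS x_1 then makes
   rhs_free true as well; such a copy is expected to disappear once the
   body is inlined into a caller. */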
int freq;
tree funtype = TREE_TYPE (node->decl);
- if (node->local.disregard_inline_limits)
- {
- inline_summary (node)->self_time = 0;
- inline_summary (node)->self_size = 0;
- inline_summary (node)->time_inlining_benefit = 0;
- inline_summary (node)->size_inlining_benefit = 0;
- }
-
if (dump_file)
fprintf (dump_file, "Analyzing function body size: %s\n",
cgraph_node_name (node));
time_inlining_benefit += cost;
size_inlining_benefit += cost;
}
- for (arg = DECL_ARGUMENTS (node->decl); arg; arg = TREE_CHAIN (arg))
+ for (arg = DECL_ARGUMENTS (node->decl); arg; arg = DECL_CHAIN (arg))
if (!VOID_TYPE_P (TREE_TYPE (arg)))
{
int cost = estimate_move_cost (TREE_TYPE (arg));
/* Estimate the stack size for the function. But not at -O0
because estimated_stack_frame_size is a quadratic problem. */
- self_stack_size = optimize ? estimated_stack_frame_size () : 0;
+ self_stack_size = optimize ? estimated_stack_frame_size (node->decl) : 0;
inline_summary (node)->estimated_self_stack_size = self_stack_size;
node->global.estimated_stack_size = self_stack_size;
node->global.stack_frame_offset = 0;
static void
inline_indirect_intraprocedural_analysis (struct cgraph_node *node)
{
- struct cgraph_edge *cs;
-
- if (!flag_ipa_cp)
- {
- ipa_initialize_node_params (node);
- ipa_detect_param_modifications (node);
- }
- ipa_analyze_params_uses (node);
-
- if (!flag_ipa_cp)
- for (cs = node->callees; cs; cs = cs->next_callee)
- {
- ipa_count_arguments (cs);
- ipa_compute_jump_functions (cs);
- }
-
- if (dump_file)
+ ipa_analyze_node (node);
+ if (dump_file && (dump_flags & TDF_DETAILS))
{
ipa_print_node_params (dump_file, node);
ipa_print_node_jump_functions (dump_file, node);
current_function_decl = node->decl;
compute_inline_parameters (node);
- if (flag_indirect_inlining)
+ /* FIXME: We should remove the optimize check after we ensure we never run
+ IPA passes when not optimizing. */
+ if (flag_indirect_inlining && optimize)
inline_indirect_intraprocedural_analysis (node);
current_function_decl = NULL;
{
unsigned int todo = 0;
struct cgraph_edge *e;
+ bool inline_p = false;
/* FIXME: Currently the pass manager is adding the inline transform more than
once to some clones. This needs revisiting after WPA cleanups. */
save_inline_function_body (node);
for (e = node->callees; e; e = e->next_callee)
- if (!e->inline_failed || warn_inline)
- break;
+ {
+ cgraph_redirect_edge_call_stmt_to_callee (e);
+ if (!e->inline_failed || warn_inline)
+ inline_p = true;
+ }
- if (e)
+ if (inline_p)
{
timevar_push (TV_INTEGRATION);
todo = optimize_inline_calls (current_function_decl);
active, we don't need to write them twice. */
static void
-inline_write_summary (cgraph_node_set set)
+inline_write_summary (cgraph_node_set set,
+ varpool_node_set vset ATTRIBUTE_UNUSED)
{
if (flag_indirect_inlining && !flag_ipa_cp)
ipa_prop_write_jump_functions (set);
0, /* properties_destroyed */
TODO_remove_functions, /* todo_flags_finish */
TODO_dump_cgraph | TODO_dump_func
- | TODO_remove_functions /* todo_flags_finish */
+ | TODO_remove_functions | TODO_ggc_collect /* todo_flags_finish */
},
inline_generate_summary, /* generate_summary */
inline_write_summary, /* write_summary */