+2015-03-21 Tom de Vries <tom@codesourcery.com>
+
+ PR tree-optimization/65458
+ * cgraph.c (cgraph_node::dump): Handle parallelized_function field.
+ * cgraph.h (cgraph_node): Add parallelized_function field.
+ * lto-cgraph.c (lto_output_node): Write parallelized_function field.
+ (input_overwrite_node): Read parallelized_function field.
+ * omp-low.c (expand_omp_taskreg, finalize_task_copyfn): Set
+ parallelized_function on cgraph_node for child_fn.
+ * tree-parloops.c: Add include of plugin-api.h, ipa-ref.h and cgraph.h.
+ Remove include of gt-tree-parloops.h.
+ (parallelized_functions): Remove static variable.
+ (parallelized_function_p): Rewrite using parallelized_function field of
+ cgraph_node.
+ (create_loop_fn): Remove adding to parallelized_functions.
+ * Makefile.in (GTFILES): Remove tree-parloops.c.
+
2015-03-20 Vladimir Makarov <vmakarov@redhat.com>
PR rtl-optimization/64366
$(srcdir)/tree-scalar-evolution.c \
$(srcdir)/tree-ssa-operands.h \
$(srcdir)/tree-profile.c $(srcdir)/tree-nested.c \
- $(srcdir)/tree-parloops.c \
$(srcdir)/omp-low.c \
$(srcdir)/omp-low.h \
$(srcdir)/targhooks.c $(out_file) $(srcdir)/passes.c $(srcdir)/cgraphunit.c \
fprintf (f, " only_called_at_exit");
if (opt_for_fn (decl, optimize_size))
fprintf (f, " optimize_size");
+ if (parallelized_function)
+ fprintf (f, " parallelized_function");
fprintf (f, "\n");
unsigned nonfreeing_fn : 1;
/* True if there was multiple COMDAT bodies merged by lto-symtab. */
unsigned merged : 1;
+ /* True if function was created to be executed in parallel. */
+ unsigned parallelized_function : 1;
private:
/* Worker for call_for_symbol_and_aliases. */
bp_pack_value (&bp, node->icf_merged, 1);
bp_pack_value (&bp, node->nonfreeing_fn, 1);
bp_pack_value (&bp, node->thunk.thunk_p, 1);
+ bp_pack_value (&bp, node->parallelized_function, 1);
bp_pack_enum (&bp, ld_plugin_symbol_resolution,
LDPR_NUM_KNOWN, node->resolution);
bp_pack_value (&bp, node->instrumentation_clone, 1);
node->icf_merged = bp_unpack_value (bp, 1);
node->nonfreeing_fn = bp_unpack_value (bp, 1);
node->thunk.thunk_p = bp_unpack_value (bp, 1);
+ node->parallelized_function = bp_unpack_value (bp, 1);
node->resolution = bp_unpack_enum (bp, ld_plugin_symbol_resolution,
LDPR_NUM_KNOWN);
node->instrumentation_clone = bp_unpack_value (bp, 1);
/* Inform the callgraph about the new function. */
cgraph_node::add_new_function (child_fn, false);
+ cgraph_node::get (child_fn)->parallelized_function = 1;
}
/* Destroy a omp_context data structures. Called through the splay tree
/* Inform the callgraph about the new function. */
DECL_STRUCT_FUNCTION (child_fn)->curr_properties = cfun->curr_properties;
cgraph_node::add_new_function (child_fn, true);
+ cgraph_node::get (child_fn)->parallelized_function = 1;
/* Fix the callgraph edges for child_cfun. Those for cfun will be
fixed in a following pass. */
#include "tree-parloops.h"
#include "omp-low.h"
#include "tree-nested.h"
+#include "plugin-api.h"
+#include "ipa-ref.h"
+#include "cgraph.h"
/* This pass tries to distribute iterations of loops into several threads.
The implementation is straightforward -- for each loop we test whether its
}
}
-/* Bitmap containing uids of functions created by parallelization. We cannot
- allocate it from the default obstack, as it must live across compilation
- of several functions; we make it gc allocated instead. */
-
-static GTY(()) bitmap parallelized_functions;
-
-/* Returns true if FN was created by create_loop_fn. */
+/* Returns true if FNDECL was created to run in parallel.  */
bool
-parallelized_function_p (tree fn)
+parallelized_function_p (tree fndecl)
{
- if (!parallelized_functions || !DECL_ARTIFICIAL (fn))
- return false;
-
- return bitmap_bit_p (parallelized_functions, DECL_UID (fn));
+ cgraph_node *node = cgraph_node::get (fndecl);
+ gcc_assert (node != NULL);
+ return node->parallelized_function;
}
/* Creates and returns an empty function that will receive the body of
type = build_function_type_list (void_type_node, ptr_type_node, NULL_TREE);
decl = build_decl (loc, FUNCTION_DECL, name, type);
- if (!parallelized_functions)
- parallelized_functions = BITMAP_GGC_ALLOC ();
- bitmap_set_bit (parallelized_functions, DECL_UID (decl));
-
TREE_STATIC (decl) = 1;
TREE_USED (decl) = 1;
DECL_ARTIFICIAL (decl) = 1;
{
return new pass_parallelize_loops (ctxt);
}
-
-
-#include "gt-tree-parloops.h"