modulo-sched: speed up DDG analysis (PR90001)

PR rtl-optimization/90001
	* ddg.c (create_ddg): Init max_dist array for each node.
	(free_ddg): Free max_dist array.
	(create_ddg_edge): Use bool field instead of aux union.
	(set_recurrence_length): Use prepared max_dist information instead
	of calling longest_simple_path.
	(create_scc): Remove graph argument, fill node's aux.count with
	SCC id, and move set_recurrence_length call to...
	(create_ddg_all_sccs): ...here, after filling all max_dist arrays
	using Floyd–Warshall-like algorithm.
	(update_dist_to_successors): Remove the whole function.
	(longest_simple_path): Likewise.
	* ddg.h (struct ddg_node): Add max_dist pointer.
	(struct ddg_edge): Use bool field instead of unused aux union.

From-SVN: r279375
This commit is contained in:
Roman Zhuykov 2019-12-13 17:02:53 +00:00 committed by Roman Zhuykov
parent 7b945b19ad
commit 728c2e5eea
3 changed files with 87 additions and 94 deletions

View file

@ -1,3 +1,19 @@
2019-12-13 Roman Zhuykov <zhroma@ispras.ru>
* ddg.c (create_ddg): Init max_dist array for each node.
(free_ddg): Free max_dist array.
(create_ddg_edge): Use bool field instead of aux union.
(set_recurrence_length): Use prepared max_dist information instead
of calling longest_simple_path.
(create_scc): Remove graph argument, fill node's aux.count with
SCC id, and move set_recurrence_length call to...
(create_ddg_all_sccs): ...here, after filling all max_dist arrays
using FloydWarshall-like algorithm.
(update_dist_to_successors): Remove the whole function.
(longest_simple_path): Likewise.
* ddg.h (struct ddg_node): Add max_dist pointer.
(struct ddg_edge): Use bool field instead of unused aux union.
2019-12-13 Andrew Stubbs <ams@codesourcery.com>
* config/gcn/gcn-valu.md (mulv64si3<exec>): Rename to ...

153
gcc/ddg.c
View file

@ -32,9 +32,6 @@ along with GCC; see the file COPYING3. If not see
#ifdef INSN_SCHEDULING
/* A flag indicating that a ddg edge belongs to an SCC or not. */
enum edge_flag {NOT_IN_SCC = 0, IN_SCC};
/* Forward declarations. */
static void add_backarc_to_ddg (ddg_ptr, ddg_edge_ptr);
static void add_backarc_to_scc (ddg_scc_ptr, ddg_edge_ptr);
@ -564,7 +561,7 @@ create_ddg (basic_block bb, int closing_branch_deps)
{
ddg_ptr g;
rtx_insn *insn, *first_note;
int i;
int i, j;
int num_nodes = 0;
g = (ddg_ptr) xcalloc (1, sizeof (struct ddg));
@ -632,6 +629,12 @@ create_ddg (basic_block bb, int closing_branch_deps)
g->nodes[i].predecessors = sbitmap_alloc (num_nodes);
bitmap_clear (g->nodes[i].predecessors);
g->nodes[i].first_note = (first_note ? first_note : insn);
g->nodes[i].aux.count = -1;
g->nodes[i].max_dist = XCNEWVEC (int, num_nodes);
for (j = 0; j < num_nodes; j++)
g->nodes[i].max_dist[j] = -1;
g->nodes[i++].insn = insn;
first_note = NULL;
}
@ -668,6 +671,7 @@ free_ddg (ddg_ptr g)
}
sbitmap_free (g->nodes[i].successors);
sbitmap_free (g->nodes[i].predecessors);
free (g->nodes[i].max_dist);
}
if (g->num_backarcs > 0)
free (g->backarcs);
@ -792,7 +796,7 @@ create_ddg_edge (ddg_node_ptr src, ddg_node_ptr dest,
e->latency = l;
e->distance = d;
e->next_in = e->next_out = NULL;
e->aux.info = 0;
e->in_scc = false;
return e;
}
@ -820,7 +824,7 @@ add_edge_to_ddg (ddg_ptr g ATTRIBUTE_UNUSED, ddg_edge_ptr e)
for now that cycles in the data dependence graph contain a single backarc.
This simplifies the algorithm, and can be generalized later. */
static void
set_recurrence_length (ddg_scc_ptr scc, ddg_ptr g)
set_recurrence_length (ddg_scc_ptr scc)
{
int j;
int result = -1;
@ -828,17 +832,14 @@ set_recurrence_length (ddg_scc_ptr scc, ddg_ptr g)
for (j = 0; j < scc->num_backarcs; j++)
{
ddg_edge_ptr backarc = scc->backarcs[j];
int length;
int distance = backarc->distance;
ddg_node_ptr src = backarc->dest;
ddg_node_ptr dest = backarc->src;
int length = src->max_dist[dest->cuid];
if (length < 0)
continue;
length = longest_simple_path (g, src->cuid, dest->cuid, scc->nodes);
if (length < 0 )
{
/* fprintf (stderr, "Backarc not on simple cycle in SCC.\n"); */
continue;
}
length += backarc->latency;
result = MAX (result, (length / distance));
}
@ -846,9 +847,9 @@ set_recurrence_length (ddg_scc_ptr scc, ddg_ptr g)
}
/* Create a new SCC given the set of its nodes. Compute its recurrence_length
and mark edges that belong to this scc as IN_SCC. */
and mark edges that belong to this scc. */
static ddg_scc_ptr
create_scc (ddg_ptr g, sbitmap nodes)
create_scc (ddg_ptr g, sbitmap nodes, int id)
{
ddg_scc_ptr scc;
unsigned int u = 0;
@ -866,16 +867,18 @@ create_scc (ddg_ptr g, sbitmap nodes)
ddg_edge_ptr e;
ddg_node_ptr n = &g->nodes[u];
gcc_assert (n->aux.count == -1);
n->aux.count = id;
for (e = n->out; e; e = e->next_out)
if (bitmap_bit_p (nodes, e->dest->cuid))
{
e->aux.count = IN_SCC;
e->in_scc = true;
if (e->distance > 0)
add_backarc_to_scc (scc, e);
}
}
set_recurrence_length (scc, g);
return scc;
}
@ -1018,7 +1021,7 @@ check_sccs (ddg_all_sccs_ptr sccs, int num_nodes)
ddg_all_sccs_ptr
create_ddg_all_sccs (ddg_ptr g)
{
int i;
int i, j, k, scc, way;
int num_nodes = g->num_nodes;
auto_sbitmap from (num_nodes);
auto_sbitmap to (num_nodes);
@ -1038,7 +1041,7 @@ create_ddg_all_sccs (ddg_ptr g)
ddg_node_ptr dest = backarc->dest;
/* If the backarc already belongs to an SCC, continue. */
if (backarc->aux.count == IN_SCC)
if (backarc->in_scc)
continue;
bitmap_clear (scc_nodes);
@ -1049,10 +1052,52 @@ create_ddg_all_sccs (ddg_ptr g)
if (find_nodes_on_paths (scc_nodes, g, from, to))
{
scc = create_scc (g, scc_nodes);
scc = create_scc (g, scc_nodes, sccs->num_sccs);
add_scc_to_ddg (sccs, scc);
}
}
/* Init max_dist arrays for FloydWarshall-like
longest patch calculation algorithm. */
for (k = 0; k < num_nodes; k++)
{
ddg_edge_ptr e;
ddg_node_ptr n = &g->nodes[k];
if (n->aux.count == -1)
continue;
n->max_dist[k] = 0;
for (e = n->out; e; e = e->next_out)
if (e->distance == 0 && g->nodes[e->dest->cuid].aux.count == n->aux.count)
n->max_dist[e->dest->cuid] = e->latency;
}
/* Run main Floid-Warshall loop. We use only non-backarc edges
inside each scc. */
for (k = 0; k < num_nodes; k++)
{
scc = g->nodes[k].aux.count;
if (scc != -1)
{
for (i = 0; i < num_nodes; i++)
if (g->nodes[i].aux.count == scc)
for (j = 0; j < num_nodes; j++)
if (g->nodes[j].aux.count == scc
&& g->nodes[i].max_dist[k] >= 0
&& g->nodes[k].max_dist[j] >= 0)
{
way = g->nodes[i].max_dist[k] + g->nodes[k].max_dist[j];
if (g->nodes[i].max_dist[j] < way)
g->nodes[i].max_dist[j] = way;
}
}
}
/* Calculate recurrence_length using max_dist info. */
for (i = 0; i < sccs->num_sccs; i++)
set_recurrence_length (sccs->sccs[i]);
order_sccs (sccs);
if (flag_checking)
@ -1155,72 +1200,4 @@ find_nodes_on_paths (sbitmap result, ddg_ptr g, sbitmap from, sbitmap to)
return bitmap_and (result, reachable_from, reach_to);
}
/* Updates the counts of U_NODE's successors (that belong to NODES) to be
at-least as large as the count of U_NODE plus the latency between them.
Sets a bit in TMP for each successor whose count was changed (increased).
Returns nonzero if any count was changed. */
static int
update_dist_to_successors (ddg_node_ptr u_node, sbitmap nodes, sbitmap tmp)
{
ddg_edge_ptr e;
int result = 0;
for (e = u_node->out; e; e = e->next_out)
{
ddg_node_ptr v_node = e->dest;
int v = v_node->cuid;
if (bitmap_bit_p (nodes, v)
&& (e->distance == 0)
&& (v_node->aux.count < u_node->aux.count + e->latency))
{
v_node->aux.count = u_node->aux.count + e->latency;
bitmap_set_bit (tmp, v);
result = 1;
}
}
return result;
}
/* Find the length of a longest path from SRC to DEST in G,
going only through NODES, and disregarding backarcs. */
int
longest_simple_path (struct ddg * g, int src, int dest, sbitmap nodes)
{
int i;
unsigned int u = 0;
int change = 1;
int num_nodes = g->num_nodes;
auto_sbitmap workset (num_nodes);
auto_sbitmap tmp (num_nodes);
/* Data will hold the distance of the longest path found so far from
src to each node. Initialize to -1 = less than minimum. */
for (i = 0; i < g->num_nodes; i++)
g->nodes[i].aux.count = -1;
g->nodes[src].aux.count = 0;
bitmap_clear (tmp);
bitmap_set_bit (tmp, src);
while (change)
{
sbitmap_iterator sbi;
change = 0;
bitmap_copy (workset, tmp);
bitmap_clear (tmp);
EXECUTE_IF_SET_IN_BITMAP (workset, 0, u, sbi)
{
ddg_node_ptr u_node = &g->nodes[u];
change |= update_dist_to_successors (u_node, nodes, tmp);
}
}
return g->nodes[dest].aux.count;
}
#endif /* INSN_SCHEDULING */

View file

@ -64,6 +64,10 @@ struct ddg_node
sbitmap successors;
sbitmap predecessors;
/* Temporary array used for Floyd-Warshall algorithm to find
scc recurrence length. */
int *max_dist;
/* For general use by algorithms manipulating the ddg. */
union {
int count;
@ -95,11 +99,8 @@ struct ddg_edge
ddg_edge_ptr next_in;
ddg_edge_ptr next_out;
/* For general use by algorithms manipulating the ddg. */
union {
int count;
void *info;
} aux;
/* Is true when edge is already in scc. */
bool in_scc;
};
/* This structure holds the Data Dependence Graph for a basic block. */
@ -178,7 +179,6 @@ ddg_all_sccs_ptr create_ddg_all_sccs (ddg_ptr);
void free_ddg_all_sccs (ddg_all_sccs_ptr);
int find_nodes_on_paths (sbitmap result, ddg_ptr, sbitmap from, sbitmap to);
int longest_simple_path (ddg_ptr, int from, int to, sbitmap via);
bool autoinc_var_is_used_p (rtx_insn *, rtx_insn *);