Commit 204b560f by Sebastian Pop Committed by Sebastian Pop

New implementation of Graphite.

2009-07-30  Sebastian Pop  <sebastian.pop@amd.com>

	* Makefile.in (OBJS-common): Added dependence on graphite-blocking.o,
	graphite-clast-to-gimple.o, graphite-dependences.o,
	graphite-interchange.o, graphite-poly.o, graphite-ppl.o,
	graphite-scop-detection.o, graphite-sese-to-poly.o, and sese.o.
	(graphite-blocking.o,
	graphite-clast-to-gimple.o, graphite-dependences.o,
	graphite-interchange.o, graphite-poly.o, graphite-ppl.o,
	graphite-scop-detection.o, graphite-sese-to-poly.o, and sese.o): New.
	* cfgloop.c (alloc_loop): Set loop->can_be_parallel to false.
	* cfgloop.h (struct loop): Add can_be_parallel field.
	* common.opt (fgraphite-identity): Moved up.
	(fgraphite-force-parallel): New flag.
	* graphite.c: Rewrite.
	* graphite.h: Rewrite.
	* passes.c (init_optimization_passes): Schedule a pass of DCE and LIM
	after Graphite.
	* toplev.c (graphite_out_file): New file descriptor.
	(graphite_in_file): New.
	(process_options): flag_graphite_force_parallel cannot be used without
	Graphite.
	* tree-ssa-loop.c: Include toplev.h.
	(gate_graphite_transforms): Enable flag_graphite for
	flag_graphite_force_parallel.

From-SVN: r150301
parent 2abae5f1
2009-07-30 Sebastian Pop <sebastian.pop@amd.com> 2009-07-30 Sebastian Pop <sebastian.pop@amd.com>
* Makefile.in (OBJS-common): Added dependence on graphite-blocking.o,
graphite-clast-to-gimple.o, graphite-dependences.o,
graphite-interchange.o, graphite-poly.o, graphite-ppl.o,
graphite-scop-detection.o, graphite-sese-to-poly.o, and sese.o.
(graphite-blocking.o,
graphite-clast-to-gimple.o, graphite-dependences.o,
graphite-interchange.o, graphite-poly.o, graphite-ppl.o,
graphite-scop-detection.o, graphite-sese-to-poly.o, and sese.o): New.
* cfgloop.c (alloc_loop): Set loop->can_be_parallel to false.
* cfgloop.h (struct loop): Add can_be_parallel field.
* common.opt (fgraphite-identity): Moved up.
(fgraphite-force-parallel): New flag.
* graphite.c: Rewrite.
* graphite.h: Rewrite.
* passes.c (init_optimization_passes): Schedule a pass of DCE and LIM
after Graphite.
* toplev.c (graphite_out_file): New file descriptor.
(graphite_in_file): New.
(process_options): flag_graphite_force_parallel cannot be used without
Graphite.
* tree-ssa-loop.c: Include toplev.h.
(gate_graphite_transforms): Enable flag_graphite for
flag_graphite_force_parallel.
2009-07-30 Sebastian Pop <sebastian.pop@amd.com>
* ChangeLog.graphite: New. * ChangeLog.graphite: New.
* graphite-blocking.c: New. * graphite-blocking.c: New.
* graphite-clast-to-gimple.c: New. * graphite-clast-to-gimple.c: New.
......
...@@ -1178,6 +1178,14 @@ OBJS-common = \ ...@@ -1178,6 +1178,14 @@ OBJS-common = \
graph.o \ graph.o \
graphds.o \ graphds.o \
graphite.o \ graphite.o \
graphite-blocking.o \
graphite-clast-to-gimple.o \
graphite-dependences.o \
graphite-interchange.o \
graphite-poly.o \
graphite-ppl.o \
graphite-scop-detection.o \
graphite-sese-to-poly.o \
gtype-desc.o \ gtype-desc.o \
haifa-sched.o \ haifa-sched.o \
hooks.o \ hooks.o \
...@@ -1251,6 +1259,7 @@ OBJS-common = \ ...@@ -1251,6 +1259,7 @@ OBJS-common = \
sel-sched-ir.o \ sel-sched-ir.o \
sel-sched-dump.o \ sel-sched-dump.o \
sel-sched.o \ sel-sched.o \
sese.o \
simplify-rtx.o \ simplify-rtx.o \
sparseset.o \ sparseset.o \
sreal.o \ sreal.o \
...@@ -2450,11 +2459,64 @@ tree-data-ref.o: tree-data-ref.c $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) \ ...@@ -2450,11 +2459,64 @@ tree-data-ref.o: tree-data-ref.c $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) \
$(GGC_H) $(TREE_H) $(RTL_H) $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) \ $(GGC_H) $(TREE_H) $(RTL_H) $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) \
$(TREE_FLOW_H) $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) \ $(TREE_FLOW_H) $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) \
$(TREE_DATA_REF_H) $(TREE_PASS_H) langhooks.h $(TREE_DATA_REF_H) $(TREE_PASS_H) langhooks.h
# Prerequisites of sese.o: its source file followed by every header whose
# modification must trigger a rebuild.  The rule itself carries no recipe.
sese.o: sese.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) \
   domwalk.h pointer-set.h value-prof.h
graphite.o: graphite.c $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) \ graphite.o: graphite.c $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) \
$(GGC_H) $(TREE_H) $(RTL_H) $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) \ $(GGC_H) $(TREE_H) $(RTL_H) $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) \
$(TREE_FLOW_H) $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) \ $(TREE_FLOW_H) $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) \
$(TREE_DATA_REF_H) $(SCEV_H) $(TREE_PASS_H) tree-chrec.h graphite.h \ $(TREE_DATA_REF_H) tree-pass.h graphite.h \
pointer-set.h value-prof.h pointer-set.h value-prof.h graphite-ppl.h sese.h \
graphite-scop-detection.h graphite-clast-to-gimple.h \
graphite-poly.h graphite-sese-to-poly.h
# Prerequisites of graphite-blocking.o: the source file first, then the
# headers it is rebuilt for.  The rule itself carries no recipe.
graphite-blocking.o: graphite-blocking.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h graphite-poly.h graphite-ppl.h
# Prerequisites of graphite-clast-to-gimple.o: the source file first, then
# the headers it is rebuilt for.  The rule itself carries no recipe.
graphite-clast-to-gimple.o: graphite-clast-to-gimple.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h pointer-set.h value-prof.h graphite-ppl.h sese.h \
   graphite-scop-detection.h graphite-clast-to-gimple.h graphite-poly.h \
   graphite-dependences.h
# Prerequisites of graphite-dependences.o: the source file first, then the
# headers it is rebuilt for.  The rule itself carries no recipe.
graphite-dependences.o: graphite-dependences.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h graphite-poly.h graphite-ppl.h \
   graphite-dependences.h
# Prerequisites of graphite-interchange.o: the source file first, then the
# headers it is rebuilt for.  The rule itself carries no recipe.
graphite-interchange.o: graphite-interchange.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h graphite-poly.h graphite-ppl.h
# Prerequisites of graphite-poly.o: the source file first, then the headers
# it is rebuilt for.  The rule itself carries no recipe.
graphite-poly.o: graphite-poly.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h graphite-dependences.h pointer-set.h value-prof.h \
   graphite-ppl.h sese.h output.h graphite-poly.h
# Prerequisites of graphite-ppl.o: the source file first, then the headers
# it is rebuilt for.  The rule itself carries no recipe.
graphite-ppl.o: graphite-ppl.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) \
   graphite-ppl.h
# Prerequisites of graphite-scop-detection.o: the source file first, then
# the headers it is rebuilt for.  The rule itself carries no recipe.
graphite-scop-detection.o: graphite-scop-detection.c \
   $(CONFIG_H) $(SYSTEM_H) $(GGC_H) $(TREE_H) $(RTL_H) $(BASIC_BLOCK_H) \
   $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) $(TREE_DUMP_H) $(TIMEVAR_H) \
   $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h $(TM_H) value-prof.h graphite-ppl.h sese.h \
   pointer-set.h coretypes.h graphite-scop-detection.h graphite-poly.h
# Prerequisites of graphite-sese-to-poly.o: the source file first, then the
# headers it is rebuilt for.  The rule itself carries no recipe.
graphite-sese-to-poly.o: graphite-sese-to-poly.c \
   $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(GGC_H) $(TREE_H) $(RTL_H) \
   $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TOPLEV_H) $(TREE_FLOW_H) \
   $(TREE_DUMP_H) $(TIMEVAR_H) $(CFGLOOP_H) $(GIMPLE_H) $(TREE_DATA_REF_H) \
   tree-pass.h graphite.h pointer-set.h value-prof.h graphite-ppl.h sese.h \
   graphite-scop-detection.h graphite-sese-to-poly.h $(PARAMS_H) \
   graphite-clast-to-gimple.h graphite-poly.h
tree-vect-loop.o: tree-vect-loop.c $(CONFIG_H) $(SYSTEM_H) coretypes.h \ tree-vect-loop.o: tree-vect-loop.c $(CONFIG_H) $(SYSTEM_H) coretypes.h \
$(TM_H) $(GGC_H) $(TREE_H) $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TREE_FLOW_H) \ $(TM_H) $(GGC_H) $(TREE_H) $(BASIC_BLOCK_H) $(DIAGNOSTIC_H) $(TREE_FLOW_H) \
$(TREE_DUMP_H) $(CFGLOOP_H) $(EXPR_H) $(RECOG_H) $(OPTABS_H) $(TOPLEV_H) \ $(TREE_DUMP_H) $(CFGLOOP_H) $(EXPR_H) $(RECOG_H) $(OPTABS_H) $(TOPLEV_H) \
......
...@@ -338,6 +338,7 @@ alloc_loop (void) ...@@ -338,6 +338,7 @@ alloc_loop (void)
loop->exits = GGC_CNEW (struct loop_exit); loop->exits = GGC_CNEW (struct loop_exit);
loop->exits->next = loop->exits->prev = loop->exits; loop->exits->next = loop->exits->prev = loop->exits;
loop->can_be_parallel = false;
return loop; return loop;
} }
......
...@@ -157,6 +157,9 @@ struct GTY ((chain_next ("%h.next"))) loop { ...@@ -157,6 +157,9 @@ struct GTY ((chain_next ("%h.next"))) loop {
/* Head of the cyclic list of the exits of the loop. */ /* Head of the cyclic list of the exits of the loop. */
struct loop_exit *exits; struct loop_exit *exits;
/* True if the loop can be parallel. */
bool can_be_parallel;
}; };
/* Flags for state of loop structure. */ /* Flags for state of loop structure. */
......
...@@ -571,6 +571,16 @@ fgraphite ...@@ -571,6 +571,16 @@ fgraphite
Common Report Var(flag_graphite) Common Report Var(flag_graphite)
Enable in and out of Graphite representation Enable in and out of Graphite representation
; This option is not documented as it does not perform any useful optimization.
fgraphite-identity
Common Report Var(flag_graphite_identity) Optimization
Enable Graphite Identity transformation
; This option is not documented as it will be removed
fgraphite-force-parallel
Common Report Var(flag_graphite_force_parallel) Optimization
Mark all loops as parallel
floop-strip-mine floop-strip-mine
Common Report Var(flag_loop_strip_mine) Optimization Common Report Var(flag_loop_strip_mine) Optimization
Enable Loop Strip Mining transformation Enable Loop Strip Mining transformation
...@@ -583,11 +593,6 @@ floop-block ...@@ -583,11 +593,6 @@ floop-block
Common Report Var(flag_loop_block) Optimization Common Report Var(flag_loop_block) Optimization
Enable Loop Blocking transformation Enable Loop Blocking transformation
; This option is not documented as it does not perform any useful optimization.
fgraphite-identity
Common Report Var(flag_graphite_identity) Optimization
Enable Graphite Identity transformation
fguess-branch-probability fguess-branch-probability
Common Report Var(flag_guess_branch_prob) Optimization Common Report Var(flag_guess_branch_prob) Optimization
Enable guessing of branch probabilities Enable guessing of branch probabilities
......
This source diff could not be displayed because it is too large. You can view the blob instead.
...@@ -21,556 +21,4 @@ along with GCC; see the file COPYING3. If not see ...@@ -21,556 +21,4 @@ along with GCC; see the file COPYING3. If not see
#ifndef GCC_GRAPHITE_H #ifndef GCC_GRAPHITE_H
#define GCC_GRAPHITE_H #define GCC_GRAPHITE_H
#include "tree-data-ref.h"
/* Declaration only; no definition of ref_nb_loops appears in this header.  */
int ref_nb_loops (data_reference_p);
/* graphite_bb_p is a pointer to struct graphite_bb (defined below).  The
   DEF_VEC_* lines declare pointer vectors, with heap allocation, of
   graphite_bb_p and of scop_p.  */
typedef struct graphite_bb *graphite_bb_p;
DEF_VEC_P(graphite_bb_p);
DEF_VEC_ALLOC_P (graphite_bb_p, heap);
DEF_VEC_P(scop_p);
DEF_VEC_ALLOC_P (scop_p, heap);
/* Forward declarations of inline helpers that are defined further down in
   this header; gbb_nb_loops calls scop_nb_params before that definition
   appears.  */
static inline int scop_nb_loops (scop_p scop);
static inline unsigned scop_nb_params (scop_p scop);
static inline bool scop_contains_loop (scop_p scop, struct loop *loop);
/* Per-basic-block record used by Graphite.  gbb_p is a pointer to this
   struct; fields are normally accessed through the GBB_* macros.  */
typedef struct graphite_bb
{
/* The basic block this record wraps (see GBB_BB).  */
basic_block bb;
/* The scop associated with this bb; its parameter count is used when
   interpreting DOMAIN (see gbb_nb_loops).  */
scop_p scop;
/* The static schedule contains the textual order for every loop layer.

   Example:

   S0
   for (i ...)
     {
       S1
       for (j ...)
         {
           S2
           S3
         }
       S4
     }
   S5
   for (k ...)
     {
       S6
       S7
       for (l ...)
         {
           S8
         }
       S9
     }
   S10

   Schedules:

      | Depth
   BB | 0  1  2
   ------------
   S0 | 0
   S1 | 1, 0
   S2 | 1, 1, 0
   S3 | 1, 1, 1
   S4 | 1, 2
   S5 | 2
   S6 | 3, 0
   S7 | 3, 1
   S8 | 3, 2, 0
   S9 | 3, 3
   S10| 4

   Normalization rules:
   - One SCoP can never contain two bbs with the same schedule timestamp.
   - All bbs at the same loop depth have a consecutive ordering (no gaps).  */
lambda_vector static_schedule;
/* The iteration domain of this bb.  It contains these columns:
   - In/Eq: whether this line is an equation or an inequation.
   - One column for every loop iterator.
   - One column for every parameter in this SCoP.
   - The constant column to add integers to the (in)equations.

   Example:

   for (i = a - 7*b + 8; i <= 3*a + 13*b + 20; i++)
     for (j = 2; j <= 2*i + 5; j++)
       for (k = 0; k <= 5; k++)
         S (i,j,k)

   Loop iterators: i, j, k
   Parameters: a, b

   (I)eq   i   j   k   a   b   1
   1       1   0   0  -1   7  -8    #  i >=  a -  7b +  8
   1      -1   0   0   3  13  20    #  i <= 3a + 13b + 20
   1       0   1   0   0   0  -2    #  j >= 2
   1       2  -1   0   0   0   5    #  j <= 2i + 5
   1       0   0   1   0   0   0    #  k >= 0
   1       0   0  -1   0   0   5    #  k <= 5

   The number of loop iterators may change and is not connected to the
   number of loops that surrounded this bb in the gimple code.  */
CloogMatrix *domain;
/* Lists containing the restrictions of the conditional statements
   dominating this bb.  This bb can only be executed if all conditions
   are true.

   Example:

   for (i = 0; i <= 20; i++)
     {
       A
       if (2i <= 8)
         B
     }

   So for B there is an additional condition (2i <= 8).

   TODO: Add these restrictions to the domain matrix.

   List of COND_EXPR and SWITCH_EXPR.  A COND_EXPR is true only if the
   corresponding element in CONDITION_CASES is not NULL_TREE.  For a
   SWITCH_EXPR the corresponding element in CONDITION_CASES is a
   CASE_LABEL_EXPR.  */
VEC (gimple, heap) *conditions;
VEC (gimple, heap) *condition_cases;
/* LOOPS contains for every column in the graphite domain the corresponding
   gimple loop.  If there exists no corresponding gimple loop LOOPS contains
   NULL.

   Example:

   Original code:

   for (i = 0; i <= 20; i++)
     for (j = 0; j <= 10; j++)
       A

   Original domain:

   (I)eq  i  j  1
   1      1  0  0   # i >= 0
   1     -1  0  20  # i <= 20
   1      0  1  0   # j >= 0
   1      0 -1  10  # j <= 10

   Original loops vector:
   0         1
   Loop i    Loop j

   After some changes (Exchange i and j, strip-mine i):

   Domain:

   (I)eq  j  ii i  k  1
   1      0  0  1  0  0   # i >= 0
   1      0  0 -1  0  20  # i <= 20
   1      1  0  0  0  0   # j >= 0
   1     -1  0  0  0  10  # j <= 10
   1      0 -1  1  0  0   # ii <= i
   1      0  1 -1  0  1   # ii + 1 >= i
   1      0 -1  0  2  0   # ii <= 2k
   1      0  1  0 -2  0   # ii >= 2k

   Iterator vector:
   0        1        2         3
   Loop j   NULL     Loop i    NULL

   Means the original loop i is now at column two of the domain and
   loop j in the original loop nest is now at column 0.  Columns 1 and
   3 are empty.  */
VEC (loop_p, heap) *loops;
/* NOTE(review): the four fields below are not documented in this header
   and are only reached through GBB_ALPHA, GBB_DYNAMIC_SCHEDULE,
   GBB_DATA_REFS and GBB_CLOOG_IV_TYPES; their exact contents should be
   confirmed against the users in graphite.c.  */
lambda_vector compressed_alpha_matrix;
CloogMatrix *dynamic_schedule;
VEC (data_reference_p, heap) *data_refs;
htab_t cloog_iv_types;
} *gbb_p;
/* Field accessors for a graphite_bb.  GBB is a pointer to the struct.
   Both the argument and the whole expansion are parenthesized so that the
   macros expand correctly for any pointer expression (for instance
   "gbbs + 1") and inside any surrounding expression.  The expansion is
   still an lvalue, so assignments through the accessors keep working.  */
#define GBB_BB(GBB) ((GBB)->bb)
#define GBB_SCOP(GBB) ((GBB)->scop)
#define GBB_STATIC_SCHEDULE(GBB) ((GBB)->static_schedule)
#define GBB_DATA_REFS(GBB) ((GBB)->data_refs)
#define GBB_ALPHA(GBB) ((GBB)->compressed_alpha_matrix)
#define GBB_DYNAMIC_SCHEDULE(GBB) ((GBB)->dynamic_schedule)
#define GBB_DOMAIN(GBB) ((GBB)->domain)
#define GBB_CONDITIONS(GBB) ((GBB)->conditions)
#define GBB_CONDITION_CASES(GBB) ((GBB)->condition_cases)
#define GBB_LOOPS(GBB) ((GBB)->loops)
#define GBB_CLOOG_IV_TYPES(GBB) ((GBB)->cloog_iv_types)
/* Return the loop that contains the basic block GBB. */
static inline struct loop *
gbb_loop (struct graphite_bb *gbb)
{
return GBB_BB (gbb)->loop_father;
}
/* Declaration only; the definition is not part of this header.  */
int nb_loops_around_gb (graphite_bb_p);
/* Calculate the number of loops around GB in the current SCOP. Only
works if GBB_DOMAIN is built. */
static inline int
gbb_nb_loops (const struct graphite_bb *gb)
{
scop_p scop = GBB_SCOP (gb);
if (GBB_DOMAIN (gb) == NULL)
return 0;
return GBB_DOMAIN (gb)->NbColumns - scop_nb_params (scop) - 2;
}
/* Return the entry of GBB_LOOPS (GB) stored at position INDEX, i.e. the
   gimple loop recorded for that loop iterator.  The entry is NULL when
   no gimple loop corresponds to it.  */
static inline loop_p
gbb_loop_at_index (graphite_bb_p gb, int index)
{
  VEC (loop_p, heap) *loops = GBB_LOOPS (gb);

  return VEC_index (loop_p, loops, index);
}
/* Return the position of LOOP inside GBB_LOOPS (GB).  LOOP is expected to
   be present: reaching the end of the vector is treated as unreachable.  */
static inline int
gbb_loop_index (graphite_bb_p gb, loop_p loop)
{
  int position = 0;
  loop_p candidate;

  while (VEC_iterate (loop_p, GBB_LOOPS (gb), position, candidate))
    {
      if (candidate == loop)
        return position;
      position++;
    }

  gcc_unreachable();
}
/* Element type of the SCOP_LOOP2CLOOG_LOOP hash table (see
   loop_domain_dim, which looks entries up with only LOOP_NUM filled in).
   Associates a loop number with a CloogLoop.  */
struct loop_to_cloog_loop_str
{
/* Number of the loop; the only field set in the lookup key built by
   loop_domain_dim.  */
unsigned int loop_num;
unsigned int loop_position; /* The column that represents this loop. */
/* The CLooG loop recorded for LOOP_NUM.  */
CloogLoop *cloog_loop;
};
/* A tree paired with a name and a loop.  name_tree is a pointer to this
   struct; vectors of name_tree hold the parameters and the old induction
   variables of a scop (see struct scop).  */
typedef struct name_tree_d
{
/* The tree itself; this is what oldiv_for_loop returns.  */
tree t;
/* NOTE(review): presumably the printable name associated with T --
   confirm against the code that fills this in.  */
const char *name;
/* The loop this entry is associated with; oldiv_for_loop matches on it.  */
struct loop *loop;
} *name_tree;
/* Pointer vector of name_tree, with heap allocation.  */
DEF_VEC_P(name_tree);
DEF_VEC_ALLOC_P (name_tree, heap);
/* A Single Entry, Single Exit region is a part of the CFG delimited
   by two edges.  The typedef sese is a pointer to this struct; fields
   are normally accessed through the SESE_* macros.  */
typedef struct sese_d
{
/* Single ENTRY and single EXIT from the SESE region. */
edge entry, exit;
/* REGION_BASIC_BLOCKS contains the set of all the basic blocks
   belonging to the SESE region. */
struct pointer_set_t *region_basic_blocks;
/* An SSA_NAME version is flagged in the LIVEOUT bitmap if the
   SSA_NAME is defined inside and used outside the SESE region. */
bitmap liveout;
/* The overall number of SSA_NAME versions used to index LIVEIN. */
int num_ver;
/* For each SSA_NAME version VER in LIVEOUT, LIVEIN[VER] contains
   the set of basic block indices that contain a use of VER. */
bitmap *livein;
} *sese;
/* Field accessors for a sese region.  S is a pointer to struct sese_d and
   I an index into its LIVEIN array.  The macro arguments are parenthesized
   so that the accessors expand correctly for any pointer or index
   expression (for instance "regions + 1" or "ver + 1"); the expansions
   remain lvalues.  */
#define SESE_ENTRY(S) ((S)->entry)
#define SESE_EXIT(S) ((S)->exit)
#define SESE_REGION_BBS(S) ((S)->region_basic_blocks)
#define SESE_LIVEOUT(S) ((S)->liveout)
#define SESE_LIVEIN(S) ((S)->livein)
#define SESE_LIVEIN_VER(S, I) ((S)->livein[(I)])
#define SESE_NUM_VER(S) ((S)->num_ver)
/* SESE region interface; the definitions are not part of this header.
   NOTE(review): judging by the names, new_sese builds a region from an
   entry and an exit edge, free_sese releases it, and
   sese_build_livein_liveouts fills the LIVEIN/LIVEOUT fields -- confirm
   against the implementation.  */
extern sese new_sese (edge, edge);
extern void free_sese (sese);
extern void sese_build_livein_liveouts (sese);
/* A SCOP is a Static Control Part of the program, simple enough to be
   represented in polyhedral form.  Fields are normally accessed through
   the SCOP_* macros.  */
struct scop
{
/* A SCOP is defined as a SESE region. */
sese region;
/* All the basic blocks in this scop that contain memory references
   and that will be represented as statements in the polyhedral
   representation. */
VEC (graphite_bb_p, heap) *bbs;
/* NOTE(review): not documented in this header; presumably the scop-level
   counterpart of the static schedule kept per graphite_bb -- confirm.  */
lambda_vector static_schedule;
/* Parameters used within the SCOP. */
VEC (name_tree, heap) *params;
/* A collection of old induction variables.  oldiv_for_loop searches it
   by loop.  */
VEC (name_tree, heap) *old_ivs;
/* Loops completely contained in the SCOP.  Bitmap indexed by loop number
   (see scop_contains_loop).  */
bitmap loops;
/* Vector of the loops of the scop; the position of a loop in this vector
   is what scop_loop_index returns, and its length is scop_nb_loops.  */
VEC (loop_p, heap) *loop_nest;
/* Hash table of struct loop_to_cloog_loop_str, looked up by loop number
   in loop_domain_dim.  */
/* ??? It looks like a global mapping loop_id -> cloog_loop would work. */
htab_t loop2cloog_loop;
/* Cloog representation of this scop. */
CloogProgram *program;
/* Are we allowed to add more params? This is for debugging purpose. We
   can only add new params before generating the bb domains, otherwise they
   become invalid. */
bool add_params;
/* LIVEOUT_RENAMES registers the rename mapping that has to be
   applied after code generation. */
htab_t liveout_renames;
};
/* Field accessors for a scop.  S is a pointer to struct scop.  Both the
   argument and the whole expansion are parenthesized so that the macros
   expand correctly for any pointer expression (for instance "scops + 1")
   and inside any surrounding expression.  The plain field accessors
   remain lvalues.  */
#define SCOP_BBS(S) ((S)->bbs)
#define SCOP_REGION(S) ((S)->region)
/* SCOP_ENTRY bb dominates all the bbs of the scop. SCOP_EXIT bb
   post-dominates all the bbs of the scop. SCOP_EXIT potentially
   contains non affine data accesses, side effect statements or
   difficult constructs, and thus is not considered part of the scop,
   but just a boundary. SCOP_ENTRY is considered part of the scop. */
#define SCOP_ENTRY(S) (SESE_ENTRY (SCOP_REGION (S))->dest)
#define SCOP_EXIT(S) (SESE_EXIT (SCOP_REGION (S))->dest)
#define SCOP_REGION_BBS(S) (SESE_REGION_BBS (SCOP_REGION (S)))
#define SCOP_STATIC_SCHEDULE(S) ((S)->static_schedule)
#define SCOP_LOOPS(S) ((S)->loops)
#define SCOP_LOOP_NEST(S) ((S)->loop_nest)
#define SCOP_ADD_PARAMS(S) ((S)->add_params)
#define SCOP_PARAMS(S) ((S)->params)
#define SCOP_OLDIVS(S) ((S)->old_ivs)
#define SCOP_PROG(S) ((S)->program)
#define SCOP_LOOP2CLOOG_LOOP(S) ((S)->loop2cloog_loop)
/* NOTE(review): struct scop as declared in this header has no
   loops_mapping member, so any use of this macro would fail to compile.
   It looks stale; kept only to leave the set of macro names unchanged.  */
#define SCOP_LOOPS_MAPPING(S) ((S)->loops_mapping)
#define SCOP_LIVEOUT_RENAMES(S) ((S)->liveout_renames)
/* Debugging, printing and dot-dumping entry points; the definitions are
   not part of this header.  NOTE(review): the meaning of the int
   arguments is not visible here -- presumably a verbosity or indentation
   level; confirm against the implementation.  */
extern void debug_scop (scop_p, int);
extern void debug_scops (int);
extern void print_graphite_bb (FILE *, graphite_bb_p, int, int);
extern void debug_gbb (graphite_bb_p, int);
extern void dot_scop (scop_p);
extern void dot_all_scops (void);
extern void debug_clast_stmt (struct clast_stmt *);
extern void debug_rename_map (htab_t);
extern void debug_ivtype_map (htab_t);
extern void debug_loop_vec (graphite_bb_p);
extern void debug_oldivs (scop_p);
/* Describes the type of an iv stack entry: it selects which member of
   iv_stack_entry_data is meaningful.  */
typedef enum {
iv_stack_entry_unknown = 0,
iv_stack_entry_iv,
iv_stack_entry_const
} iv_stack_entry_kind;
/* Data contained in an iv stack entry: either an induction variable
   (name_tree) or a constant (tree).  */
typedef union iv_stack_entry_data_union
{
name_tree iv;
tree constant;
} iv_stack_entry_data;
/* Datatype for loop iv stack entry: the KIND tag together with the DATA
   union it describes.  */
typedef struct iv_stack_entry_struct
{
iv_stack_entry_kind kind;
iv_stack_entry_data data;
} iv_stack_entry;
/* Pointer to an entry, and the heap-allocated pointer vector type built
   from it.  */
typedef iv_stack_entry *iv_stack_entry_p;
DEF_VEC_P(iv_stack_entry_p);
DEF_VEC_ALLOC_P(iv_stack_entry_p,heap);
/* A loop iv stack is handled through a pointer to a vector pointer.  */
typedef VEC(iv_stack_entry_p, heap) **loop_iv_stack;
/* Declaration only; the definition is not part of this header.  */
extern void debug_loop_iv_stack (loop_iv_stack);
/* Look LOOP up in SCOP_OLDIVS (SCOP) and return the tree of the first
   entry recorded for it.  Returns NULL_TREE when LOOP is NULL or when no
   entry matches.  */
static inline tree
oldiv_for_loop (scop_p scop, loop_p loop)
{
  int position = 0;
  name_tree entry;

  if (loop == NULL)
    return NULL_TREE;

  while (VEC_iterate (name_tree, SCOP_OLDIVS (scop), position, entry))
    {
      if (entry->loop == loop)
        return entry->t;
      position++;
    }

  return NULL_TREE;
}
/* Return the number of loops recorded in SCOP_LOOP_NEST (SCOP).  */
static inline int
scop_nb_loops (scop_p scop)
{
  VEC (loop_p, heap) *nest = SCOP_LOOP_NEST (scop);

  return VEC_length (loop_p, nest);
}
/* Return the number of entries in SCOP_PARAMS (SCOP).  */
static inline unsigned
scop_nb_params (scop_p scop)
{
  VEC (name_tree, heap) *params = SCOP_PARAMS (scop);

  return VEC_length (name_tree, params);
}
/* Return the dimension of the domains for SCOP: one per loop of the
   scop, one per parameter, plus one.  */
static inline int
scop_dim_domain (scop_p scop)
{
  int nb_loops = scop_nb_loops (scop);
  unsigned nb_params = scop_nb_params (scop);

  return nb_loops + nb_params + 1;
}
/* Return the domain dimension for GB, which is the domain dimension of
   the scop GB belongs to.  */
static inline int
gbb_dim_domain (graphite_bb_p gb)
{
  scop_p scop = GBB_SCOP (gb);

  return scop_dim_domain (scop);
}
/* Return the dimensionality of the iteration domain of the loop numbered
   LOOP_NUM with respect to SCOP.  The loop is looked up in
   SCOP_LOOP2CLOOG_LOOP (SCOP); when found, the result is the dimension
   of its CLooG domain plus two.  */
static inline int
loop_domain_dim (unsigned int loop_num, scop_p scop)
{
  struct loop_to_cloog_loop_str key;
  struct loop_to_cloog_loop_str *found;

  key.loop_num = loop_num;
  found = (struct loop_to_cloog_loop_str *)
    htab_find (SCOP_LOOP2CLOOG_LOOP (scop), &key);

  if (found)
    return cloog_domain_dim (cloog_loop_domain (found->cloog_loop)) + 2;

  /* The loop containing the entry of the scop is not always part of
     the SCoP, and then it is not registered in SCOP_LOOP2CLOOG_LOOP:
     only the parameters contribute in that case.  */
  return scop_nb_params (scop) + 2;
}
/* Return the dimensionality of the iteration vector of the loop numbered
   LOOP_NUM with respect to SCOP: its domain dimension without the two
   extra columns and without the parameters of SCOP.  */
static inline int
loop_iteration_vector_dim (unsigned int loop_num, scop_p scop)
{
  int domain_dim = loop_domain_dim (loop_num, scop);
  unsigned nb_params = scop_nb_params (scop);

  return domain_dim - 2 - nb_params;
}
/* Return true when the bit for the number of LOOP is set in
   SCOP_LOOPS (SCOP), i.e. when SCOP contains LOOP.  LOOP must not be
   NULL.  */
static inline bool
scop_contains_loop (scop_p scop, struct loop *loop)
{
  bitmap contained = SCOP_LOOPS (scop);

  return bitmap_bit_p (contained, loop->num);
}
/* Return the position of LOOP in SCOP_LOOP_NEST (SCOP), which is its
   index in the domain matrix for SCOP.  Asserts that SCOP contains LOOP;
   not finding LOOP in the vector is treated as unreachable.  */
static inline int
scop_loop_index (scop_p scop, struct loop *loop)
{
  unsigned position = 0;
  struct loop *candidate;

  gcc_assert (scop_contains_loop (scop, loop));

  while (VEC_iterate (loop_p, SCOP_LOOP_NEST (scop), position, candidate))
    {
      if (candidate == loop)
        return position;
      position++;
    }

  gcc_unreachable();
}
/* Return the index, in the loop nest of SCOP, of the loop returned by
   gbb_loop for GB.  */
static inline int
gbb_inner_most_loop_index (scop_p scop, graphite_bb_p gb)
{
  struct loop *containing = gbb_loop (gb);

  return scop_loop_index (scop, containing);
}
/* Walk outwards from LOOP while the visited loop is contained in SCOP.
   The walk stops at, and returns, the first visited loop that has a
   sibling (a non-NULL "next").  When the walk instead leaves SCOP, the
   last loop that was still inside SCOP is returned, or CURRENT_OUTER
   when LOOP itself is not contained in SCOP.

   Running off the top of the loop tree (loop_outer returning NULL) is
   handled like leaving SCOP instead of passing NULL on to
   scop_contains_loop, which would dereference it.  The function is
   "static inline", like the other helpers in this header, so that files
   including the header without calling it do not trigger
   unused-function warnings.  */
static inline struct loop *
outer_most_loop_1 (scop_p scop, struct loop* loop, struct loop* current_outer)
{
  while (loop != NULL && scop_contains_loop (scop, loop))
    {
      if (loop->next != NULL)
        return loop;

      current_outer = loop;
      loop = loop_outer (loop);
    }

  return current_outer;
}
/* Return the outermost loop found by outer_most_loop_1 when walking
   outwards from LOOP inside SCOP, or NULL when LOOP is not contained in
   SCOP.  Declared "static inline", like the other helpers of this
   header, so that files including the header without calling it do not
   trigger unused-function warnings.  */
static inline struct loop *
outer_most_loop (scop_p scop, struct loop *loop)
{
  return outer_most_loop_1 (scop, loop, NULL);
}
/* Return the index, in the loop nest of SCOP, of the loop that
   outer_most_loop finds when starting from the loop of GB.  */
static inline int
gbb_outer_most_loop_index (scop_p scop, graphite_bb_p gb)
{
  struct loop *innermost = gbb_loop (gb);
  struct loop *outermost = outer_most_loop (scop, innermost);

  return scop_loop_index (scop, outermost);
}
/* Return the loop depth of LOOP in SCOP: the number of loops enclosing
   LOOP, walking outwards, that are contained in SCOP.  The walk stops at
   the first enclosing loop outside SCOP, or at the top of the loop tree
   (loop_outer returning NULL), so a NULL loop is never passed to
   scop_contains_loop, which would dereference it.  LOOP itself must not
   be NULL.  */
static inline unsigned int
scop_gimple_loop_depth (scop_p scop, loop_p loop)
{
  unsigned int depth = 0;

  for (loop = loop_outer (loop);
       loop != NULL && scop_contains_loop (scop, loop);
       loop = loop_outer (loop))
    depth++;

  return depth;
}
#endif /* GCC_GRAPHITE_H */ #endif /* GCC_GRAPHITE_H */
...@@ -658,6 +658,11 @@ init_optimization_passes (void) ...@@ -658,6 +658,11 @@ init_optimization_passes (void)
NEXT_PASS (pass_loop_distribution); NEXT_PASS (pass_loop_distribution);
NEXT_PASS (pass_linear_transform); NEXT_PASS (pass_linear_transform);
NEXT_PASS (pass_graphite_transforms); NEXT_PASS (pass_graphite_transforms);
{
struct opt_pass **p = &pass_graphite_transforms.pass.sub;
NEXT_PASS (pass_dce_loop);
NEXT_PASS (pass_lim);
}
NEXT_PASS (pass_iv_canon); NEXT_PASS (pass_iv_canon);
NEXT_PASS (pass_if_conversion); NEXT_PASS (pass_if_conversion);
NEXT_PASS (pass_vectorize); NEXT_PASS (pass_vectorize);
......
...@@ -1801,7 +1801,8 @@ process_options (void) ...@@ -1801,7 +1801,8 @@ process_options (void)
|| flag_loop_block || flag_loop_block
|| flag_loop_interchange || flag_loop_interchange
|| flag_loop_strip_mine || flag_loop_strip_mine
|| flag_graphite_identity) || flag_graphite_identity
|| flag_graphite_force_parallel)
sorry ("Graphite loop optimizations cannot be used"); sorry ("Graphite loop optimizations cannot be used");
#endif #endif
...@@ -2046,7 +2047,7 @@ process_options (void) ...@@ -2046,7 +2047,7 @@ process_options (void)
if (flag_signaling_nans) if (flag_signaling_nans)
flag_trapping_math = 1; flag_trapping_math = 1;
/* We cannot reassociate if we want traps or signed zeros.  */ /* We cannot reassociate if we want traps or signed zeros. */
if (flag_associative_math && (flag_trapping_math || flag_signed_zeros)) if (flag_associative_math && (flag_trapping_math || flag_signed_zeros))
{ {
warning (0, "-fassociative-math disabled; other options take precedence"); warning (0, "-fassociative-math disabled; other options take precedence");
......
...@@ -36,6 +36,7 @@ along with GCC; see the file COPYING3. If not see ...@@ -36,6 +36,7 @@ along with GCC; see the file COPYING3. If not see
#include "flags.h" #include "flags.h"
#include "tree-inline.h" #include "tree-inline.h"
#include "tree-scalar-evolution.h" #include "tree-scalar-evolution.h"
#include "toplev.h"
#include "tree-vectorizer.h" #include "tree-vectorizer.h"
/* The loop superpass. */ /* The loop superpass. */
...@@ -307,9 +308,12 @@ gate_graphite_transforms (void) ...@@ -307,9 +308,12 @@ gate_graphite_transforms (void)
/* Enable -fgraphite pass if any one of the graphite optimization flags /* Enable -fgraphite pass if any one of the graphite optimization flags
is turned on. */ is turned on. */
if (flag_loop_block || flag_loop_interchange || flag_loop_strip_mine if (flag_loop_block || flag_loop_interchange || flag_loop_strip_mine
|| flag_graphite_identity) || flag_graphite_identity || flag_graphite_force_parallel)
flag_graphite = 1; flag_graphite = 1;
if (flag_loop_block)
sorry ("loop blocking not implemented");
return flag_graphite != 0; return flag_graphite != 0;
} }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment