00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036
00037
00038
00039
00040
00041
00042
00043
00044
00045
00046
00052 #ifndef AUTOD_DECLARE
00053
00054 #define AUTOD_DECLARE
00055
00056
00057 #include <sys/types.h>
00058 #ifndef lnopt_main_INCLUDED
00059 #include "lnopt_main.h"
00060 #endif
00061 #ifndef lnoutils_INCLUDED
00062 #include "lnoutils.h"
00063 #endif
00064 #ifndef lwn_util_INCLUDED
00065 #include "lwn_util.h"
00066 #endif
00067 #ifndef _lno_bv_INCLUDED
00068 #include "lno_bv.h"
00069 #endif
00070 #ifndef bin_tree_INCLUDED
00071 #include "btree.h"
00072 #endif
00073 #ifndef cxx_graph_INCLUDED
00074 #include "cxx_graph.h"
00075 #endif
00076 #ifndef graph_template_INCLUDED
00077 #include "graph_template.h"
00078 #endif
00079
00080
// Free-function entry points declared by this header; each takes a WN* and
// returns nothing.  Their definitions are not part of this file.
// NOTE(review): judging by the names only, the first drives the DISTRIBUTION
// pass and the second the TRANSPOSE_DIRECTED_GRAPH16 pass declared below --
// confirm against the definitions.
00081 void Automatic_Data_Distribute(WN *wn);
00082 void Transpose_For_MP(WN *wn);
00083
00084
00085 class ARRAY_DESCRIPTOR
00086 {
00087 mBOOL _is_bad;
00088 BIT_VECTOR *_parallel_dims;
00089 ST *_st;
00090
00091 public:
00092 BOOL Is_Bad() const { return _is_bad; };
00093 BOOL operator <(const ARRAY_DESCRIPTOR &array) const {
00094 return (_st < array._st);
00095 }
00096 BOOL operator >(const ARRAY_DESCRIPTOR &array) const {
00097 return (_st > array._st);
00098 }
00099 BOOL operator ==(const ARRAY_DESCRIPTOR &array) const {
00100 return (_st == array._st);
00101 }
00102 ARRAY_DESCRIPTOR &operator=(const ARRAY_DESCRIPTOR &array) {
00103 _st = array._st;
00104 _is_bad = array._is_bad;
00105 _parallel_dims = array._parallel_dims;
00106 return *this;
00107 }
00108 ARRAY_DESCRIPTOR() {;};
00109 ARRAY_DESCRIPTOR(ST *st, BIT_VECTOR *parallel_dims, BOOL is_bad) {
00110 _st = st;
00111 _parallel_dims = parallel_dims;
00112 _is_bad = is_bad;
00113 }
00114 void Union(ARRAY_DESCRIPTOR *ad) {
00115 if (_is_bad) return;
00116 if (ad->_is_bad || !(*_parallel_dims == *ad->_parallel_dims)) {
00117 _is_bad = TRUE;
00118 }
00119 }
00120 void Set_Bad() { _is_bad=TRUE; };
00121 void Distribute_Array(WN *insertion_point);
00122 };
00123
// BINARY_TREE instantiated over ARRAY_DESCRIPTOR.
// NOTE(review): presumably ordered through ARRAY_DESCRIPTOR's <, > and ==
// operators, which compare the ST pointer -- confirm in btree.h.
00124 typedef BINARY_TREE<ARRAY_DESCRIPTOR> ARRAY_DESCR_TREE;
// Despite the DESCR in its name, this stack holds raw ST pointers, not
// ARRAY_DESCRIPTOR objects.
00125 typedef STACK<ST *> ARRAY_DESCR_STACK;
00126
00127 class DISTRIBUTION
00128 {
00129 ARRAY_DESCR_TREE *_locals;
00130 ARRAY_DESCR_TREE *_globals;
00131 ARRAY_DESCR_STACK *_locals_stack;
00132 ARRAY_DESCR_STACK *_globals_stack;
00133 MEM_POOL *_pool;
00134 WN *_preamble;
00135 enum {epsilon = 5};
00136 void Gather_Arrays(WN *wn, BOOL seen_mp);
00137 void Process_Memory(WN *wn);
00138 void Distribute_Arrays();
00139 DOLOOP_STACK *_do_stack;
00140 public:
00141 DISTRIBUTION(WN *wn, MEM_POOL *pool);
00142 };
00143
00144
00145
// Fixed capacity of the per-vertex can_be_parallel[] array (TVERTEX) and the
// per-edge constraint[] array (TEDGE) declared below.
00146 #define TRANSPOSE_MAX_SIZE 16
00147
00148
00149
00150 class ARRAY_TRANSPOSE_DESCRIPTOR
00151 {
00152 ST *_st;
00153 INT _dimension;
00154 VINDEX16 _vertex;
00155 mBOOL _transposable;
00156 public:
00157
00158 BOOL operator <(const ARRAY_TRANSPOSE_DESCRIPTOR &array) const {
00159 return (_st < array._st);
00160 }
00161 BOOL operator >(const ARRAY_TRANSPOSE_DESCRIPTOR &array) const {
00162 return (_st > array._st);
00163 }
00164 BOOL operator ==(const ARRAY_TRANSPOSE_DESCRIPTOR &array) const {
00165 return (_st == array._st);
00166 }
00167 ARRAY_TRANSPOSE_DESCRIPTOR &operator=(const ARRAY_TRANSPOSE_DESCRIPTOR &array) {
00168 _st = array._st;
00169 _vertex = array._vertex;
00170 _transposable = array._transposable;
00171 _dimension = array._dimension;
00172 return *this;
00173 }
00174 ARRAY_TRANSPOSE_DESCRIPTOR(ST *st) {
00175 _st = st;
00176 _transposable = TRUE;
00177 _vertex = 0;
00178 _dimension = -1;
00179 }
00180 ARRAY_TRANSPOSE_DESCRIPTOR(ST *st, BOOL transposable) {
00181 _st = st;
00182 _transposable = transposable;
00183 _vertex = 0;
00184 _dimension = -1;
00185 }
00186 ARRAY_TRANSPOSE_DESCRIPTOR() {;};
00187 VINDEX16 Get_Vertex() { return _vertex; };
00188 void Set_Vertex(INT i) { _vertex=i; };
00189 INT Get_Dimension() { return _dimension; };
00190 void Set_Dimension(INT value) { _dimension=value; };
00191 void Set_Transposable() { _transposable = TRUE; };
00192 void Reset_Transposable() { _transposable = FALSE; };
00193 BOOL Transposable() { return _transposable; };
00194 };
00195
// BINARY_TREE instantiated over ARRAY_TRANSPOSE_DESCRIPTOR.
// NOTE(review): presumably ordered through the descriptor's <, > and ==
// operators, which compare the ST pointer -- confirm in btree.h.
00196 typedef BINARY_TREE<ARRAY_TRANSPOSE_DESCRIPTOR> ARRAY_TRANSPOSE_TREE;
00197
00198
00199 class TVERTEX : public VERTEX16
00200 {
00201 public:
00202 INT size;
00203 INT value;
00204
00205 BOOL is_loop;
00206 union {
00207 WN *inner_loop;
00208 ST *st;
00209 } tvertex_union;
00210 TVERTEX(WN *wn, INT size) { tvertex_union.inner_loop = wn; size = size; is_loop = TRUE; }
00211 TVERTEX(ST *st, INT size) { tvertex_union.st = st; size = size; is_loop = FALSE; }
00212 mBOOL can_be_parallel[TRANSPOSE_MAX_SIZE];
00213 friend class TRANSPOSE_DIRECTED_GRAPH16;
00214 };
00215
00216
00217
00218
00219
00220 class TEDGE : public EDGE16
00221 {
00222 public:
00223 INT constraint[TRANSPOSE_MAX_SIZE];
00224 TEDGE() { ; };
00225 friend class TRANSPOSE_DIRECTED_GRAPH16;
00226 };
00227
00228 class TRANSPOSE_DIRECTED_GRAPH16: public DIRECTED_GRAPH16<TEDGE,TVERTEX> {
00229 BOOL Outermore_Parallelizable(WN *wn);
00230 BOOL Contains_Parallelizable(WN *wn,INT nloops);
00231 BOOL _is_bad;
00232 void Gather_Arrays(WN *wn,ARRAY_TRANSPOSE_TREE *arrays);
00233 BOOL IO_element_read(WN *item);
00234 void Build_Snl(WN *inner, INT nloops, ARRAY_TRANSPOSE_TREE *arrays);
00235 void Build_Snl_Arrays(WN *outer, ARRAY_TRANSPOSE_TREE *arrays,
00236 INT outer_depth,INT inner_depth,VINDEX16 snl_v);
00237 void Build_Snl_Array(WN *array, ARRAY_TRANSPOSE_TREE *arrays,
00238 INT outer_depth,INT inner_depth,VINDEX16 snl_v);
00239 BOOL Local_Array(ST *st);
00240 BOOL Propogate_V(VINDEX16 v);
00241 void Clear_Values();
00242 VINDEX16 Get_Loop_Vertex();
00243 BOOL _did_transpose;
00244 void Record(ARRAY_TRANSPOSE_TREE *arrays);
00245 public:
00246 TRANSPOSE_DIRECTED_GRAPH16( mUINT16 num_v, mUINT16 num_e) :
00247 DIRECTED_GRAPH16<TEDGE,TVERTEX>(num_v,num_e) {
00248 _is_bad = FALSE;
00249 _did_transpose = FALSE;
00250 }
00251 BOOL Did_Transpose() { return _did_transpose; };
00252 void Transpose(WN *wn,ARRAY_TRANSPOSE_TREE *arrays);
00253 void Transpose_Array(WN *array, INT dim);
00254 void Transpose_Array(ST *st, INT dim);
00255 void Build(WN *wn,ARRAY_TRANSPOSE_TREE *arrays);
00256 void Solve(ARRAY_TRANSPOSE_TREE *arrays);
00257
00258 EINDEX16 Add_Edge(VINDEX16 from, VINDEX16 to, INT size) {
00259 EINDEX16 result = DIRECTED_GRAPH16<TEDGE,TVERTEX>::Add_Edge(from,to);
00260 for (INT i=0; i<size; i++) {
00261 _e[result].constraint[i] = -1;
00262 }
00263 return result;
00264 }
00265 void Set_Constraint(EINDEX16 edge,INT index, INT val) {
00266 _e[edge].constraint[index] = val;
00267 }
00268 INT Get_Constraint(EINDEX16 edge,INT index) {
00269 return _e[edge].constraint[index];
00270 }
00271 VINDEX16 Add_Vertex(INT size, WN *loop) {
00272 VINDEX16 result = DIRECTED_GRAPH16<TEDGE,TVERTEX>::Add_Vertex();
00273 _v[result].tvertex_union.inner_loop = loop;
00274 _v[result].size = size;
00275 _v[result].is_loop = TRUE;
00276 return result;
00277 }
00278 VINDEX16 Add_Vertex(INT size, ST *st) {
00279 VINDEX16 result = DIRECTED_GRAPH16<TEDGE,TVERTEX>::Add_Vertex();
00280 _v[result].tvertex_union.st = st;
00281 _v[result].size = size;
00282 _v[result].is_loop = FALSE;
00283 return result;
00284 }
00285 mBOOL Can_Be_Parallel(VINDEX16 v, INT i) {
00286 return _v[v].can_be_parallel[i];
00287 }
00288 void Set_Can_Be_Parallel(VINDEX16 v, INT i) {
00289 _v[v].can_be_parallel[i]=TRUE;
00290 }
00291 void Reset_Can_Be_Parallel(VINDEX16 v, INT i) {
00292 _v[v].can_be_parallel[i]=FALSE;
00293 }
00294 void Print(FILE *fp);
00295
00296 };
00297
00298
00299 #endif // AUTOD_DECLARE
00300