00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036 #ifdef USE_PCH
00037 #include "lno_pch.h"
00038 #endif // USE_PCH
00039 #pragma hdrstop
00040
00041 #include <sys/types.h>
00042
00043 #include "lnoutils.h"
00044 #include "lnopt_main.h"
00045 #include "stab.h"
00046 #include "targ_const.h"
00047 #include "wn_simp.h"
00048 #include "stdlib.h"
00049 #include "lwn_util.h"
00050 #include "strtab.h"
00051 #include "config.h"
00052 #include "optimizer.h"
00053 #include "opt_du.h"
00054 #include "name.h"
00055 #include "wintrinsic.h"
00056 #include "lno_bv.h"
00057 #include "dep_graph.h"
00058 #include "debug.h"
00059 #include "cxx_memory.h"
00060 #include "move.h"
00061 #include "snl_utils.h"
00062 #include "access_vector.h"
00063 #include "array_bounds.h"
00064 #include "soe.h"
00065 #include "cond.h"
00066 #include "tlog.h"
00067 #include "fiz_fuse.h"
00068 #include "forward.h"
00069 #include "prompf.h"
00070
00071 #include "ir_reader.h"
00072
00073
00074
00075
00076
00077
00078 extern void Remove_Zero_Trip_Loop(WN* wn_loop)
00079 {
00080
00081 if (Is_Nested_Doacross(wn_loop)) {
00082 DevWarn("Attempted removing one loop out of a nested doacross");
00083 return;
00084 }
00085
00086 if (LNO_Verbose) {
00087 fprintf(stdout, "Removing Zero Trip Loop on line %d\n",
00088 (INT) WN_linenum(wn_loop));
00089 fprintf(TFile, "Removing Zero Trip Loop on line %d\n",
00090 (INT) WN_linenum(wn_loop));
00091 }
00092 if (LNO_Tlog)
00093 Generate_Tlog("LNO", "trip_count", Srcpos_To_Line(WN_linenum(wn_loop)),
00094 (char *) WB_Whirl_Symbol(wn_loop), "", "", "zero-trip");
00095 FmtAssert(Iterations(wn_loop, &LNO_local_pool) == 0,
00096 ("Loop is not zero trip."));
00097 WN* wn_asg = WN_start(wn_loop);
00098 if (Index_Variable_Live_At_Exit(wn_loop)) {
00099 LWN_Insert_Block_Before(LWN_Get_Parent(wn_loop), wn_loop,
00100 WN_start(wn_loop));
00101 WN_start(wn_loop) = NULL;
00102 }
00103 LWN_Extract_From_Block(wn_loop);
00104 LWN_Delete_Tree(wn_loop);
00105 }
00106
00107
00108
00109
00110
00111
00112
00113 static void Remove_Unity_Trip_Loop_Loop_Stmt_Update(WN* wn_loop,
00114 DU_MANAGER* du)
00115 {
00116 LWN_ITER* itr = LWN_WALK_TreeIter(WN_do_body(wn_loop));
00117 WN* replace_with = LWN_Get_Parent(wn_loop);
00118 while (replace_with && WN_opcode(replace_with) != OPC_DO_LOOP)
00119 replace_with = LWN_Get_Parent(replace_with);
00120 for ( ; itr; itr = LWN_WALK_TreeNext(itr)) {
00121 WN* wn = itr->wn;
00122 OPERATOR opr = WN_operator(wn);
00123 DEF_LIST *def_list = du->Ud_Get_Def(wn);
00124 if (def_list) {
00125 if (def_list->Loop_stmt() == wn_loop) {
00126 du->Ud_Get_Def(wn)->Set_loop_stmt(replace_with);
00127 }
00128 }
00129 }
00130 }
00131
00132
00133
00134
00135
00136
00137
00138 extern void Remove_Unity_Trip_Loop_Dep_Update(WN* wn_loop,
00139 ARRAY_DIRECTED_GRAPH16* dg,
00140 BOOL will_not_remove_loop)
00141 {
00142 for (LWN_ITER *iter = LWN_WALK_TreeIter(WN_do_body(wn_loop));
00143 iter; iter = LWN_WALK_TreeNext(iter)) {
00144 WN* wn = iter->wn;
00145 OPCODE op = WN_opcode(wn);
00146 if (!OPCODE_is_load(op) && !OPCODE_is_store(op) && !OPCODE_is_call(op))
00147 continue;
00148 VINDEX16 v = dg->Get_Vertex(wn);
00149 if (v == 0)
00150 continue;
00151
00152
00153
00154
00155 INT do_depth = Block_Loop_Depth(wn);
00156 FmtAssert(do_depth >= 0, ("this vertex must be inside a loop!"));
00157 if (do_depth == 0) {
00158 EINDEX16 e;
00159 EINDEX16 enext = 0;
00160 for (e = dg->Get_In_Edge(v); e; e = enext) {
00161 enext = dg->Get_Next_In_Edge(e);
00162 dg->Delete_Array_Edge(e);
00163 }
00164 for (e = dg->Get_Out_Edge(v); e; e = enext) {
00165 enext = dg->Get_Next_Out_Edge(e);
00166 dg->Delete_Array_Edge(e);
00167 }
00168 dg->Delete_Vertex(v);
00169 continue;
00170 }
00171
00172
00173
00174 EINDEX16 e_next = 0;
00175 for (EINDEX16 e = dg->Get_Out_Edge(v); e; e = e_next) {
00176 e_next = dg->Get_Next_Out_Edge(e);
00177 VINDEX16 vSink = dg->Get_Sink(e);
00178 WN* wnSink = dg->Get_Wn(vSink);
00179 if (!Wn_Is_Inside(wnSink, WN_do_body(wn_loop)))
00180 continue;
00181 DEPV_ARRAY* dva = dg->Depv_Array(e);
00182 INT wd_component = Do_Loop_Depth(wn_loop) - dva->Num_Unused_Dim();
00183 if (wd_component >= 0) {
00184 FmtAssert(wd_component < dva->Num_Dim(),
00185 ("Bad indexing into dependence vector."));
00186
00187
00188 INT dva_new_num_vec = 0;
00189 for (INT i = 0; i < dva->Num_Vec(); i++) {
00190 DEPV* dv = dva->Depv(i);
00191 if (DEP_Direction(DEPV_Dep(dv, wd_component)) & DIR_EQ)
00192 dva_new_num_vec++;
00193 }
00194
00195 if (dva_new_num_vec > 0) {
00196 mUINT8 new_unused_dim=dva->Num_Unused_Dim();
00197 if (will_not_remove_loop)
00198 new_unused_dim++;
00199 DEPV_ARRAY* dva_new = Create_DEPV_ARRAY(dva_new_num_vec,
00200 dva->Num_Dim() - 1, new_unused_dim, dg->Pool());
00201 INT j = 0;
00202 for (INT i = 0; i < dva->Num_Vec(); i++) {
00203 DEPV* dv = dva->Depv(i);
00204 if (!(DEP_Direction(DEPV_Dep(dv, wd_component)) & DIR_EQ))
00205 continue;
00206 DEPV* dv_new = dva_new->Depv(j++);
00207 INT dnew = 0;
00208 for (INT dold = 0; dold < dva->Num_Dim(); dold++) {
00209 if (dold == wd_component)
00210 continue;
00211 FmtAssert(dnew >= 0 && dnew < dva_new->Num_Dim(),
00212 ("Bad indexing into dependence vector."));
00213 DEPV_Dep(dv_new, dnew++) = DEPV_Dep(dv, dold);
00214 }
00215 }
00216 Delete_DEPV_ARRAY(dva, dg->Pool());
00217 dg->Set_Depv_Array(e, dva_new);
00218 } else {
00219 dg->Delete_Array_Edge(e);
00220 }
00221 } else if (!will_not_remove_loop) {
00222
00223
00224 dva->Set_Num_Unused_Dim(dva->Num_Unused_Dim()-1);
00225 }
00226 }
00227 }
00228 }
00229
00230
00231
00232
00233
00234
00235
00236
00237 static void Remove_Unity_Trip_Loop_Update_If_Accesses(WN* wn_parent)
00238 {
00239 for (WN* wn = wn_parent; wn != NULL; wn = LWN_Get_Parent(wn)) {
00240 if (WN_opcode(wn) == OPC_DO_LOOP)
00241 return;
00242 if (WN_opcode(wn) == OPC_IF) {
00243 LWN_ITER* itr = LWN_WALK_TreeIter(wn);
00244 for (; itr != NULL; itr = LWN_WALK_TreeNext(itr))
00245 if (WN_opcode(itr->wn) == OPC_DO_LOOP)
00246 break;
00247 BOOL has_do_loops = itr != NULL;
00248 IF_INFO* ii = Get_If_Info(wn);
00249 ii->Contains_Do_Loops = has_do_loops;
00250 }
00251 }
00252 }
00253
00254
00255
00256
00257
00258
00259
00260 static void Remove_Unity_Trip_Loop_Update_Is_Inner(WN* wn_parent)
00261 {
00262 WN* wn = 0;
00263 for (wn = wn_parent; wn != NULL; wn = LWN_Get_Parent(wn))
00264 if (WN_opcode(wn) == OPC_DO_LOOP)
00265 break;
00266 if (wn == NULL)
00267 return;
00268 WN* wn_loop = wn;
00269 LWN_ITER* itr = LWN_WALK_TreeIter(WN_do_body(wn_loop));
00270 for (; itr != NULL; itr = LWN_WALK_TreeNext(itr))
00271 if (WN_opcode(itr->wn) == OPC_DO_LOOP)
00272 break;
00273 if (itr != NULL)
00274 return;
00275 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
00276 dli->Is_Inner = TRUE;
00277 }
00278
00279
00280
00281
00282
00283
00284
00285
00286 static void Decrement_Loop_Depths(WN* wn_loop)
00287 {
00288 if (WN_opcode(wn_loop) == OPC_DO_LOOP) {
00289 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
00290 dli->Depth--;
00291 }
00292 if (WN_opcode(wn_loop) == OPC_BLOCK) {
00293 for (WN* wn = WN_first(wn_loop); wn != NULL; wn = WN_next(wn))
00294 Decrement_Loop_Depths(wn);
00295 } else {
00296 for (INT i = 0; i < WN_kid_count(wn_loop); i++)
00297 Decrement_Loop_Depths(WN_kid(wn_loop, i));
00298 }
00299 }
00300
00301
00302
00303
00304
00305
00306
00307
00308
00309 extern void Remove_Unity_Trip_Loop(WN* wn_loop,
00310 BOOL update_access,
00311 WN** wn_first,
00312 WN** wn_last,
00313 ARRAY_DIRECTED_GRAPH16* dg,
00314 DU_MANAGER* du)
00315 {
00316
00317 if (Is_Nested_Doacross(wn_loop)) {
00318 DevWarn("Attempted removing one loop out of a nested doacross");
00319 *wn_first = wn_loop;
00320 *wn_last = wn_loop;
00321 return;
00322 }
00323
00324
00325 if (Index_Variable_Live_At_Exit(wn_loop)) {
00326 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
00327 FmtAssert(dli != NULL, ("Remove_Unity_Trip_Loop: No DO_LOOP_INFO"));
00328 if (dli->Has_Gotos) {
00329 WN* wn_copy = LWN_Copy_Tree(WN_start(wn_loop));
00330 LWN_Copy_Def_Use(WN_kid0(WN_start(wn_loop)), WN_kid0(wn_copy), du);
00331 const DU_NODE* node = NULL;
00332 USE_LIST *use_list = du->Du_Get_Use(WN_start(wn_loop));
00333 if (use_list != NULL) {
00334 USE_LIST_ITER iter(use_list);
00335 for (node = iter.First(); !iter.Is_Empty(); node = iter.Next()) {
00336 WN* wn_use = node->Wn();
00337 du->Add_Def_Use(wn_copy, wn_use);
00338 }
00339 if (use_list->Incomplete()) {
00340 USE_LIST* use_list_copy = du->Du_Get_Use(wn_copy);
00341 use_list_copy->Set_Incomplete();
00342 }
00343 }
00344 LWN_Insert_Block_Before(LWN_Get_Parent(wn_loop), wn_loop, wn_copy);
00345 if (dg != NULL) {
00346 if (!dg->Add_Deps_To_Copy_Block(WN_kid0(WN_start(wn_loop)),
00347 WN_kid0(wn_copy), FALSE))
00348 LNO_Erase_Dg_From_Here_In(WN_start(wn_loop), dg);
00349 }
00350 }
00351 Finalize_Index_Variable_For_Remove_Unity_Trip_Loop(wn_loop, TRUE);
00352 }
00353
00354 if (LNO_Verbose) {
00355 fprintf(stdout, "Removing Unity Trip Loop on line %d\n",
00356 (INT) WN_linenum(wn_loop));
00357 fprintf(TFile, "Removing Unity Trip Loop on line %d\n",
00358 (INT) WN_linenum(wn_loop));
00359 }
00360 if (LNO_Tlog)
00361 Generate_Tlog("LNO", "trip_count", Srcpos_To_Line(WN_linenum(wn_loop)),
00362 (char *) WB_Whirl_Symbol(wn_loop), "", "", "unity-trip");
00363
00364
00365
00366 INT64 iter = Iterations(wn_loop, &LNO_local_pool);
00367 FmtAssert((iter == 1) || (iter == -1),
00368 ("Loop not unity trip."));
00369
00370
00371 WN* kid = NULL;
00372 WN* parent = LWN_Get_Parent(wn_loop);
00373 WN *wn_loop_block = WN_do_body(wn_loop);
00374 WN* wd_lower_bound = WN_kid0(WN_start(wn_loop));
00375 BOOL lb_is_const = FALSE;
00376 if (WN_operator(wd_lower_bound) != OPR_INTCONST) {
00377 Replace_Ldid_With_Exp_Copy(WN_index(wn_loop), WN_do_body(wn_loop),
00378 wd_lower_bound, du);
00379 } else {
00380 lb_is_const = TRUE;
00381 }
00382
00383 Remove_Unity_Trip_Loop_Loop_Stmt_Update(wn_loop, du);
00384 if (dg) Remove_Unity_Trip_Loop_Dep_Update(wn_loop, dg, FALSE);
00385 WN* wn_parent = LWN_Get_Parent(wn_loop);
00386
00387
00388 *wn_first = WN_first(wn_loop_block);
00389 *wn_last = WN_last(wn_loop_block);
00390 while ((kid = WN_last(wn_loop_block)) != NULL) {
00391 WN* exkid = LWN_Extract_From_Block(kid);
00392 LWN_Insert_Block_After(parent, wn_loop, exkid);
00393 }
00394
00395 if (lb_is_const) {
00396 WN* lb = LWN_Copy_Tree(WN_start(wn_loop));
00397 WN* tmp = WN_start(wn_loop);
00398 WN_start(wn_loop) = lb;
00399 LWN_Set_Parent(WN_start(wn_loop),wn_loop);
00400 lb = tmp;
00401 LWN_Insert_Block_Before(LWN_Get_Parent(wn_loop),wn_loop,lb);
00402 *wn_first = lb;
00403 if (*wn_last == NULL)
00404 *wn_last = lb;
00405 }
00406
00407
00408 if (Prompf_Info != NULL && Prompf_Info->Is_Enabled()) {
00409 INT old_id = WN_MAP32_Get(Prompf_Id_Map, wn_loop);
00410 Prompf_Info->Remove_Unity_Trip(old_id);
00411 WN_MAP32_Set(Prompf_Id_Map, wn_loop, 0);
00412 }
00413
00414
00415 LWN_Delete_Tree(wn_loop);
00416
00417
00418 if (update_access) {
00419 for (WN* wn = *wn_first; wn != NULL; wn = WN_next(wn)) {
00420 DOLOOP_STACK dostack(&LNO_local_pool);
00421 Build_Doloop_Stack(LWN_Get_Parent(wn), &dostack);
00422 LNO_Build_Access(wn, &dostack, &LNO_default_pool);
00423 if (wn == *wn_last)
00424 break;
00425 }
00426 }
00427
00428
00429 for (WN* wn = *wn_first; wn != NULL; wn = WN_next(wn)) {
00430 Decrement_Loop_Depths(wn);
00431 if (wn == *wn_last)
00432 break;
00433 }
00434
00435
00436 Remove_Unity_Trip_Loop_Update_If_Accesses(wn_parent);
00437 Remove_Unity_Trip_Loop_Update_Is_Inner(wn_parent);
00438
00439 WN *lb = *wn_first;
00440 if (lb && WN_operator(lb) == OPR_STID) {
00441 if (WN_operator(WN_kid0(lb)) == OPR_INTCONST) {
00442 Constant_Propogate(lb,WN_const_val(WN_kid0(lb)));
00443 USE_LIST *uses = Du_Mgr->Du_Get_Use(lb);
00444 if (uses && !uses->Incomplete() && uses->Is_Empty()) {
00445 *wn_first = WN_next(*wn_first);
00446 if (*wn_first == NULL)
00447 *wn_last = NULL;
00448 LWN_Delete_Tree(lb);
00449 }
00450 }
00451 }
00452
00453 }
00454
00455
00456
00457
00458
00459
00460
00461
00462
00463
00464 static BOOL Inner_LB_Is_Outer_Index_Variable(WN* wn_inner_loop,
00465 WN* wn_outer_loop)
00466 {
00467 DO_LOOP_INFO* dli_inner = Get_Do_Loop_Info(wn_inner_loop);
00468 DO_LOOP_INFO* dli_outer = Get_Do_Loop_Info(wn_outer_loop);
00469 ACCESS_ARRAY* aa_inner_lb = dli_inner->LB;
00470 if (Bound_Is_Too_Messy(aa_inner_lb))
00471 return FALSE;
00472 if (aa_inner_lb->Num_Vec() > 1)
00473 return FALSE;
00474 ACCESS_VECTOR* av_inner_lb = aa_inner_lb->Dim(0);
00475 for (INT i = 0; i < av_inner_lb->Nest_Depth(); i++) {
00476 if (i == dli_outer->Depth) {
00477 if (av_inner_lb->Loop_Coeff(i) != (mINT32) 1)
00478 return FALSE;
00479 } else if (i == dli_inner->Depth) {
00480 if (av_inner_lb->Loop_Coeff(i) != (mINT32) -1)
00481 return FALSE;
00482 } else if (av_inner_lb->Loop_Coeff(i) != 0) {
00483 return FALSE;
00484 }
00485 }
00486 if (av_inner_lb->Contains_Lin_Symb() || av_inner_lb->Contains_Non_Lin_Symb())
00487 return FALSE;
00488 if (av_inner_lb->Const_Offset != 0)
00489 return FALSE;
00490 return TRUE;
00491 }
00492
00493
00494
00495
00496
00497
00498
00499
00500
00501
00502 static ACCESS_VECTOR* Inner_LB_Outer_IV_Offset(WN* wn_inner_loop,
00503 WN* wn_outer_loop)
00504 {
00505 DO_LOOP_INFO* dli_inner = Get_Do_Loop_Info(wn_inner_loop);
00506 DO_LOOP_INFO* dli_outer = Get_Do_Loop_Info(wn_outer_loop);
00507 ACCESS_ARRAY* aa_inner_lb = dli_inner->LB;
00508 if (Bound_Is_Too_Messy(aa_inner_lb))
00509 return FALSE;
00510 if (aa_inner_lb->Num_Vec() > 1)
00511 return FALSE;
00512 ACCESS_VECTOR* av_inner_lb = aa_inner_lb->Dim(0);
00513 for (INT i = 0; i < av_inner_lb->Nest_Depth(); i++) {
00514 if (i == dli_outer->Depth) {
00515 if (av_inner_lb->Loop_Coeff(i) != (mINT32) 1)
00516 return FALSE;
00517 } else if (i == dli_inner->Depth) {
00518 if (av_inner_lb->Loop_Coeff(i) != (mINT32) -1)
00519 return FALSE;
00520 } else if (av_inner_lb->Loop_Coeff(i) != 0) {
00521 return FALSE;
00522 }
00523 }
00524 ACCESS_VECTOR* av = CXX_NEW(ACCESS_VECTOR(av_inner_lb, &LNO_local_pool),
00525 &LNO_local_pool);
00526 av->Set_Loop_Coeff(dli_inner->Depth, 0);
00527 return av;
00528 }
00529
00530
00531
00532
00533
00534
00535
00536
00537 static BOOL Loop_Has_Positive_Trip(WN* wn_loop)
00538 {
00539 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
00540 if (dli->LB->Num_Vec() > 1)
00541 return FALSE;
00542 if (dli->UB->Num_Vec() > 1)
00543 return FALSE;
00544 ACCESS_VECTOR* av = Add(dli->LB->Dim(0), dli->UB->Dim(0), &LNO_local_pool);
00545 return av->Is_Const() && av->Const_Offset > 0;
00546 }
00547
00548
00549
00550
00551
00552
00553
00554
00555
00556
00557
00558
00559
00560
00561
00562 static BOOL Access_Vector_Condition_Provable(ACCESS_VECTOR* av,
00563 WN* wn_loop)
00564 {
00565
00566 if (av->Is_Const())
00567 return av->Const_Offset == 0;
00568
00569
00570 INT loop_count = 0;
00571 INT loop_index = -1;
00572 for (INT i = 0; i < av->Nest_Depth(); i++) {
00573 if (av->Loop_Coeff(i) != 0) {
00574 loop_count++;
00575 loop_index = i;
00576 }
00577 }
00578 if (loop_count > 1)
00579 return FALSE;
00580
00581
00582 WN* wn = 0;
00583 for (wn = wn_loop; wn != NULL; wn = LWN_Get_Parent(wn))
00584 if (WN_opcode(wn) == OPC_DO_LOOP && Do_Loop_Depth(wn) == loop_index)
00585 break;
00586 WN* wn_index_loop = wn;
00587 DO_LOOP_INFO* dli_index = Get_Do_Loop_Info(wn_index_loop);
00588 if (!dli_index->Step->Is_Const() || dli_index->Step->Const_Offset < 1)
00589 return FALSE;
00590
00591
00592
00593 if (dli_index->LB->Num_Vec() > 1)
00594 return FALSE;
00595 ACCESS_VECTOR *avs = Subtract(av, dli_index->LB->Dim(0), &LNO_local_pool);
00596 if (avs->Is_Const() && avs->Const_Offset == 0)
00597 return TRUE;
00598
00599
00600 WN* wnn = NULL;
00601 INT if_count = 0;
00602 WN* wn_if = NULL;
00603 WN* wn_branch = NULL;
00604 for (wn = wn_loop; wn != NULL; wnn = wn, wn = LWN_Get_Parent(wn)) {
00605 if (WN_opcode(wn) == OPC_IF) {
00606 if_count++;
00607 wn_if = wn;
00608 wn_branch = wnn;
00609 }
00610 }
00611 if (if_count != 1)
00612 return FALSE;
00613 BOOL is_then_branch = WN_then(wn_if) == wn_branch;
00614 IF_INFO* if_info = Get_If_Info(wn_if);
00615 if (if_info->Condition->Num_Vec() > 1)
00616 return FALSE;
00617 ACCESS_VECTOR av_if(if_info->Condition->Dim(0), &LNO_local_pool);
00618 if (is_then_branch && !if_info->Condition_On_Then
00619 || !is_then_branch && if_info->Condition_On_Then) {
00620 av_if.Mul(-1);
00621 av_if.Const_Offset = -av_if.Const_Offset;
00622 av_if.Const_Offset -= 1;
00623 }
00624 ACCESS_VECTOR *avf = Subtract(av, &av_if, &LNO_local_pool);
00625 if (avf->Is_Const() && avf->Const_Offset == 0)
00626 return TRUE;
00627
00628 return FALSE;
00629 }
00630
00631
00632
00633
00634
00635
00636
00637
00638
00639 static BOOL Outer_LB_GE_Inner_UB(WN* wn_inner_loop,
00640 WN* wn_outer_loop)
00641 {
00642 DO_LOOP_INFO* dli_inner = Get_Do_Loop_Info(wn_inner_loop);
00643 DO_LOOP_INFO* dli_outer = Get_Do_Loop_Info(wn_outer_loop);
00644 ACCESS_ARRAY* aa_outer_lb = dli_outer->LB;
00645 if (Bound_Is_Too_Messy(aa_outer_lb))
00646 return FALSE;
00647 if (aa_outer_lb->Num_Vec() > 1)
00648 return FALSE;
00649 ACCESS_ARRAY* aa_inner_ub = dli_inner->UB;
00650 if (Bound_Is_Too_Messy(aa_inner_ub))
00651 return FALSE;
00652 if (aa_inner_ub->Num_Vec() > 1)
00653 return FALSE;
00654 ACCESS_VECTOR av_outer_lb(aa_outer_lb->Dim(0), &LNO_local_pool);
00655 ACCESS_VECTOR av_inner_ub(aa_inner_ub->Dim(0), &LNO_local_pool);
00656 if (av_outer_lb.Loop_Coeff(dli_outer->Depth) != -1)
00657 return FALSE;
00658 av_outer_lb.Set_Loop_Coeff(dli_outer->Depth, 0);
00659 if (av_inner_ub.Loop_Coeff(dli_inner->Depth) != 1)
00660 return FALSE;
00661 av_inner_ub.Set_Loop_Coeff(dli_inner->Depth, 0);
00662 INT i;
00663 for (i = dli_outer->Depth; i < av_outer_lb.Nest_Depth(); i++)
00664 if (av_outer_lb.Loop_Coeff(i) != 0)
00665 return FALSE;
00666 for (i = dli_outer->Depth; i < av_inner_ub.Nest_Depth(); i++)
00667 if (av_outer_lb.Loop_Coeff(i) != 0)
00668 return FALSE;
00669 av_outer_lb.Set_Nest_Depth(dli_outer->Depth);
00670 av_inner_ub.Set_Nest_Depth(dli_outer->Depth);
00671 ACCESS_VECTOR* av = Add(&av_inner_ub, &av_outer_lb, &LNO_local_pool);
00672 av->Mul(-1);
00673 av->Const_Offset = -av->Const_Offset;
00674 if (Access_Vector_Condition_Provable(av, wn_outer_loop))
00675 return TRUE;
00676 return FALSE;
00677 }
00678
00679
00680
00681
00682
00683
00684
00685
00686 static WN* Perfect_Nested_Outer_Loop(WN* wn_inner_loop)
00687 {
00688 DO_LOOP_INFO* dli_inner = Get_Do_Loop_Info(wn_inner_loop);
00689 if (dli_inner->Depth == 0)
00690 return NULL;
00691 if (WN_prev(wn_inner_loop) != NULL)
00692 return NULL;
00693 WN* wn_outer_loop = LWN_Get_Parent(LWN_Get_Parent(wn_inner_loop));
00694 if (WN_opcode(wn_outer_loop) != OPC_DO_LOOP)
00695 return NULL;
00696 DO_LOOP_INFO* dli_outer = Get_Do_Loop_Info(wn_outer_loop);
00697 if (!dli_inner->Step->Is_Const() || dli_inner->Step->Const_Offset != 1)
00698 return NULL;
00699 if (!dli_outer->Step->Is_Const() || dli_outer->Step->Const_Offset != 1)
00700 return NULL;
00701 if (!Upper_Bound_Standardize(WN_end(wn_inner_loop), TRUE))
00702 return NULL;
00703 if (!Upper_Bound_Standardize(WN_end(wn_outer_loop), TRUE))
00704 return NULL;
00705 return wn_outer_loop;
00706 }
00707
00708
00709
00710
00711
00712
00713
00714 static void Forward_Substitute_For_Access_Arrays(WN* wn_inner_loop,
00715 DU_MANAGER* du)
00716 {
00717 WN* wn_outer_loop = LWN_Get_Parent(LWN_Get_Parent(wn_inner_loop));
00718 FmtAssert(wn_outer_loop != NULL,
00719 ("Should be applied to a pair of coupled loops"));
00720 Forward_Substitute_Ldids(WN_kid0(WN_start(wn_outer_loop)), du);
00721 Forward_Substitute_Ldids(UBexp(WN_end(wn_outer_loop)), du);
00722 Forward_Substitute_Ldids(WN_kid0(WN_start(wn_inner_loop)), du);
00723 Forward_Substitute_Ldids(UBexp(WN_end(wn_inner_loop)), du);
00724 for (WN* wn = wn_inner_loop; wn != NULL; wn = LWN_Get_Parent(wn))
00725 if (WN_opcode(wn) == OPC_IF)
00726 Forward_Substitute_Ldids(WN_if_test(wn), du);
00727 }
00728
00729
00730
00731
00732
00733
00734
00735
00736
00737
00738
00739
00740
00741
00742
00743 static BOOL Unifiable_Loop(WN* wn_inner_loop,
00744 DU_MANAGER* du)
00745 {
00746 WN* wn_outer_loop = Perfect_Nested_Outer_Loop(wn_inner_loop);
00747 if (wn_outer_loop == NULL)
00748 return FALSE;
00749 Forward_Substitute_For_Access_Arrays(wn_inner_loop, du);
00750 if (!Inner_LB_Is_Outer_Index_Variable(wn_inner_loop, wn_outer_loop))
00751 return FALSE;
00752 if (!Loop_Has_Positive_Trip(wn_outer_loop))
00753 return FALSE;
00754 if (Index_Variable_Live_At_Exit(wn_outer_loop))
00755 return FALSE;
00756 if (!Outer_LB_GE_Inner_UB(wn_inner_loop, wn_outer_loop))
00757 return FALSE;
00758 return TRUE;
00759 }
00760
00761
00762
00763
00764
00765
00766
00767
00768
00769
00770
00771
00772
00773 static void Unify_Loop(WN* wn_inner_loop,
00774 DU_MANAGER* du)
00775 {
00776 WN* wn_outer_loop = LWN_Get_Parent(LWN_Get_Parent(wn_inner_loop));
00777 if (LNO_Verbose) {
00778 fprintf(stdout, "Unifying Coupled Loops on lines %d and %d\n",
00779 (INT) WN_linenum(wn_inner_loop), (INT) WN_linenum(wn_outer_loop));
00780 fprintf(TFile, "Unifying Coupled Loops on lines %d and %d\n",
00781 (INT) WN_linenum(wn_inner_loop), (INT) WN_linenum(wn_outer_loop));
00782 }
00783 if (LNO_Tlog)
00784 Generate_Tlog("LNO", "trip_count",
00785 Srcpos_To_Line(WN_linenum(wn_inner_loop)),
00786 (char *) WB_Whirl_Symbol(wn_inner_loop), "", "", "unify-coupled-loops");
00787 Replace_Wnexp_With_Exp_Copy(UBexp(WN_end(wn_outer_loop)),
00788 WN_kid0(WN_start(wn_outer_loop)), du);
00789 Replace_Wnexp_With_Exp_Copy(WN_kid0(WN_start(wn_inner_loop)),
00790 UBexp(WN_end(wn_inner_loop)), du);
00791 DOLOOP_STACK dostack(&LNO_local_pool);
00792 Build_Doloop_Stack(LWN_Get_Parent(wn_outer_loop), &dostack);
00793 LNO_Build_Access(wn_outer_loop, &dostack, &LNO_default_pool);
00794 }
00795
00796
00797
00798
00799
00800
00801
00802
00803
00804 static INT Trip_Reducible_Loop(WN* wn_inner_loop,
00805 DU_MANAGER* du)
00806 {
00807 WN* wn_outer_loop = Perfect_Nested_Outer_Loop(wn_inner_loop);
00808 if (wn_outer_loop == NULL)
00809 return 0;
00810 Forward_Substitute_For_Access_Arrays(wn_inner_loop, du);
00811 if (Index_Variable_Live_At_Exit(wn_outer_loop))
00812 return 0;
00813 ACCESS_VECTOR* av = Inner_LB_Outer_IV_Offset(wn_inner_loop, wn_outer_loop);
00814 if (av == NULL)
00815 return 0;
00816 DO_LOOP_INFO* dli_inner = Get_Do_Loop_Info(wn_inner_loop);
00817 if (dli_inner->UB->Num_Vec() > 1)
00818 return 0;
00819 ACCESS_VECTOR* av_offset = Add(av, dli_inner->UB->Dim(0), &LNO_local_pool);
00820 DO_LOOP_INFO* dli_outer = Get_Do_Loop_Info(wn_outer_loop);
00821 if (dli_outer->UB->Num_Vec() > 1)
00822 return 0;
00823 av_offset->Set_Nest_Depth(dli_outer->Depth + 1);
00824 ACCESS_VECTOR* av_diff = Subtract(dli_outer->UB->Dim(0), av_offset,
00825 &LNO_local_pool);
00826 if (!av_diff->Is_Const() || av_diff->Const_Offset <= 0)
00827 return 0;
00828 return av_diff->Const_Offset;
00829 }
00830
00831
00832
00833
00834
00835
00836
00837 static void Trip_Reduce_Loop(WN* wn_loop,
00838 INT loop_count,
00839 DU_MANAGER* du)
00840 {
00841 if (LNO_Verbose) {
00842 fprintf(stdout, "Trip Reducing Loop on line %d\n",
00843 (INT) WN_linenum(wn_loop));
00844 fprintf(TFile, "Trip Reducing Loop on line %d\n",
00845 (INT) WN_linenum(wn_loop));
00846 }
00847 if (LNO_Tlog)
00848 Generate_Tlog("LNO", "trip_count", Srcpos_To_Line(WN_linenum(wn_loop)),
00849 (char *) WB_Whirl_Symbol(wn_loop), "", "", "trip-reduce-coupled-loops");
00850 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
00851 FmtAssert(!Bound_Is_Too_Messy(dli->UB), ("Should be screened out"));
00852 FmtAssert(dli->UB->Num_Vec() == 1, ("Should be screened out"));
00853 dli->UB->Dim(0)->Const_Offset -= loop_count;
00854 FmtAssert(UBexp(WN_end(wn_loop)), ("Should already be standardized"));
00855 WN* wn_copy = LWN_Copy_Tree(UBexp(WN_end(wn_loop)));
00856 LWN_Copy_Def_Use(UBexp(WN_end(wn_loop)), wn_copy, du);
00857 WN* wn_diff = LWN_Make_Icon(WN_rtype(wn_copy), -loop_count);
00858 TYPE_ID type_add = WN_rtype(wn_copy);
00859 OPCODE op_add = OPCODE_make_op(OPR_ADD, type_add, MTYPE_V);
00860 WN* wn_exp = LWN_CreateExp2(op_add, wn_copy, wn_diff);
00861 Replace_Wnexp_With_Exp_Copy(UBexp(WN_end(wn_loop)), wn_exp, du);
00862 LWN_Delete_Tree(wn_exp);
00863 }
00864
00865
00866
00867
00868
00869
00870 static void Coupled_Loops_Traverse(WN* wn_tree,
00871 DU_MANAGER* du)
00872 {
00873 if (WN_opcode(wn_tree) == OPC_DO_LOOP) {
00874 if (Unifiable_Loop(wn_tree, du))
00875 Unify_Loop(wn_tree, du);
00876 INT reduce_count = Trip_Reducible_Loop(wn_tree, du);
00877 if (reduce_count > 0)
00878 Trip_Reduce_Loop(LWN_Get_Parent(LWN_Get_Parent(wn_tree)),
00879 reduce_count, du);
00880 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_tree);
00881 if (dli->Is_Inner)
00882 return;
00883 }
00884
00885 if (WN_opcode(wn_tree) == OPC_BLOCK) {
00886 for (WN* wn = WN_first(wn_tree); wn != NULL; wn = WN_next(wn))
00887 Coupled_Loops_Traverse(wn, du);
00888 } else {
00889 for (INT i = 0; i < WN_kid_count(wn_tree); i++)
00890 Coupled_Loops_Traverse(WN_kid(wn_tree, i), du);
00891 }
00892 }
00893
00894
00895
00896
00897
00898
00899
00900 extern void Optimize_Coupled_Loops(WN* wn_tree,
00901 DU_MANAGER* du)
00902 {
00903 if (!LNO_Coupled_Opts)
00904 return;
00905 Coupled_Loops_Traverse(wn_tree, du);
00906 }
00907
00908
00909
00910
00911
00912
00913
00914 static BOOL Has_Scalar_Use_Inside_Loop(WN* wn_def,
00915 WN* wn_loop,
00916 DU_MANAGER* du)
00917 {
00918
00919 if (WN_operator(wn_def) == OPR_ISTORE)
00920 return FALSE;
00921 USE_LIST *use_list = du->Du_Get_Use(wn_def);
00922 if (use_list == NULL)
00923 return FALSE;
00924 if (use_list->Incomplete())
00925 return TRUE;
00926 USE_LIST_ITER iter(use_list);
00927 const DU_NODE* node = NULL;
00928 for (node = iter.First(); !iter.Is_Empty(); node = iter.Next()) {
00929 WN* wn_use = node->Wn();
00930 if (Wn_Is_Inside(wn_use, wn_loop))
00931 return TRUE;
00932 }
00933 return FALSE;
00934 }
00935
00936
00937
00938
00939
00940
00941
00942
00943 static BOOL Has_Array_Dep_Carried_Inside_Loop(WN* wn_def,
00944 WN* wn_loop,
00945 ARRAY_DIRECTED_GRAPH16* dg)
00946 {
00947 VINDEX16 v = dg->Get_Vertex(wn_def);
00948 if (v == 0)
00949 return !WN_operator(wn_def) == OPR_STID;
00950 EINDEX16 e = 0;
00951 for (e = dg->Get_In_Edge(v); e != 0; e = dg->Get_Next_In_Edge(e)) {
00952 WN* wn_source = dg->Get_Wn(dg->Get_Source(e));
00953 if (wn_source == wn_def)
00954 continue;
00955 DEPV_ARRAY* dva = dg->Depv_Array(e);
00956 INT dep_depth = dva->Loop_Carrying_Dependence();
00957 if (dep_depth >= Do_Loop_Depth(wn_loop))
00958 return TRUE;
00959 }
00960 for (e = dg->Get_Out_Edge(v); e != 0; e = dg->Get_Next_Out_Edge(e)) {
00961 DEPV_ARRAY* dva = dg->Depv_Array(e);
00962 WN* wn_sink = dg->Get_Wn(dg->Get_Sink(e));
00963 if (wn_sink == wn_def)
00964 continue;
00965 INT dep_depth = dva->Loop_Carrying_Dependence();
00966 if (dep_depth >= Do_Loop_Depth(wn_loop))
00967 return TRUE;
00968 }
00969 return FALSE;
00970 }
00971
00972
00973
00974
00975
00976
00977
00978 static BOOL Has_Complex_Access_Array(WN* wn_def,
00979 WN* wn_loop)
00980 {
00981 if (WN_operator(wn_def) != OPR_ISTORE)
00982 return FALSE;
00983 WN* wn_array = WN_kid1(wn_def);
00984 if (WN_operator(wn_array) != OPR_ARRAY)
00985 return TRUE;
00986 ACCESS_ARRAY *aa = (ACCESS_ARRAY *) WN_MAP_Get(LNO_Info_Map, wn_array);
00987 if (Bound_Is_Too_Messy(aa))
00988 return TRUE;
00989 if (aa->Non_Const_Loops() > Do_Loop_Depth(wn_loop))
00990 return TRUE;
00991 return FALSE;
00992 }
00993
00994
00995
00996
00997
00998
00999
01000 static void Mark_Indexed_References(WN* wn_def,
01001 INT indexed[])
01002 {
01003 if (WN_operator(wn_def) != OPR_ISTORE)
01004 return;
01005 WN* wn_array = WN_kid1(wn_def);
01006 if (WN_operator(wn_array) != OPR_ARRAY)
01007 return;
01008 ACCESS_ARRAY* aa = (ACCESS_ARRAY *) WN_MAP_Get(LNO_Info_Map, wn_array);
01009 for (INT i = 0; i < aa->Num_Vec(); i++) {
01010 ACCESS_VECTOR* av = aa->Dim(i);
01011 for (INT j = 0; j < av->Nest_Depth(); j++)
01012 if (av->Loop_Coeff(j) != 0)
01013 indexed[j] = TRUE;
01014 }
01015 }
01016
01017
01018
01019
01020
01021
01022
01023
01024 static ACCESS_VECTOR* Access_Trip_Count(WN *wn_outer_loop,
01025 WN* wn_loop)
01026 {
01027 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
01028 if (dli->LB->Num_Vec() > 1 || Bound_Is_Too_Messy(dli->LB)
01029 || dli->LB->Non_Const_Loops() > Do_Loop_Depth(wn_outer_loop))
01030 return NULL;
01031 if (dli->UB->Num_Vec() > 1 || Bound_Is_Too_Messy(dli->UB)
01032 || dli->UB->Non_Const_Loops() > Do_Loop_Depth(wn_outer_loop))
01033 return NULL;
01034 ACCESS_VECTOR* av = Add(dli->UB->Dim(0), dli->LB->Dim(0), &LNO_local_pool);
01035 av->Mul(-1);
01036 av->Const_Offset += 1;
01037 return av;
01038 }
01039
01040
01041
01042
01043
01044
01045
01046
01047
01048
01049 static void Discard_Possibly_Empty_Loops(WN* wn_loop,
01050 INT nest_depth,
01051 BOOL indexed[])
01052 {
01053 ACCESS_VECTOR** av_trip = CXX_NEW_ARRAY(ACCESS_VECTOR*, nest_depth + 1,
01054 &LNO_local_pool);
01055 INT i;
01056 for (i = 0; i <= nest_depth; i++)
01057 av_trip[i] = NULL;
01058 WN* wn = 0;
01059 for (wn = wn_loop; wn != NULL; wn = Find_Next_Innermost_Do(wn))
01060 if (!indexed[Do_Loop_Depth(wn)])
01061 break;
01062 if (wn == NULL)
01063 return;
01064 WN* wn_first = wn;
01065 INT first_index = Do_Loop_Depth(wn_first);
01066 for (wn = wn_first; wn != NULL; wn = Find_Next_Innermost_Do(wn))
01067 av_trip[Do_Loop_Depth(wn)] = Access_Trip_Count(wn_loop, wn);
01068 for (wn = wn_first; wn != NULL; wn = Find_Next_Innermost_Do(wn)) {
01069 i = Do_Loop_Depth(wn);
01070 if (indexed[i])
01071 continue;
01072 for (INT j = Do_Loop_Depth(wn) + 1; j <= nest_depth; j++) {
01073 if (av_trip[j] == NULL || av_trip[j]->Loop_Coeff(i) < 0) {
01074 indexed[Do_Loop_Depth(wn)] = TRUE;
01075 break;
01076 }
01077 }
01078 }
01079 }
01080
01081
01082
01083
01084
01085
01086
01087
01088 static void Set_Indexed_Loop_Bounds(ACCESS_ARRAY* aa,
01089 INT loop_depth,
01090 BOOL indexed[],
01091 BOOL is_upper_bound)
01092 {
01093 if (aa == NULL || aa->Too_Messy) {
01094 for (INT i = 0; i < loop_depth; i++)
01095 indexed[i] = TRUE;
01096 return;
01097 }
01098 INT i;
01099 for (i = 0; i < aa->Num_Vec(); i++) {
01100 ACCESS_VECTOR* av = aa->Dim(i);
01101 if (!av->Has_Loop_Coeff()) {
01102 for (INT j = 0; j < loop_depth; j++)
01103 indexed[j] = TRUE;
01104 return;
01105 }
01106 if (is_upper_bound) {
01107 for (INT j = 0; j < loop_depth; j++)
01108 if (av->Loop_Coeff(j) > 0)
01109 indexed[j] = TRUE;
01110 } else {
01111 for (INT j = 0; j < loop_depth; j++)
01112 if (av->Loop_Coeff(j) != 0)
01113 indexed[j] = TRUE;
01114 }
01115 }
01116 INT const_limit = aa->Non_Const_Loops();
01117 if (const_limit > loop_depth)
01118 const_limit = loop_depth;
01119 for (i = 0; i < const_limit; i++)
01120 indexed[i] = TRUE;
01121 }
01122
01123
01124
01125
01126
01127
01128
01129 extern DOLOOP_STACK* SNL_Finalizable_Loops(WN* wn_loop,
01130 ARRAY_DIRECTED_GRAPH16* dg,
01131 DU_MANAGER* du)
01132 {
01133 DOLOOP_STACK* stack_final
01134 = CXX_NEW(DOLOOP_STACK(&LNO_default_pool), &LNO_default_pool);
01135
01136 if (!LNO_Loop_Finalization || wn_loop == NULL)
01137 return stack_final;
01138
01139 if (!Do_Loop_Is_Good(wn_loop) || Is_Nested_Doacross(wn_loop) ||
01140 Do_Loop_Has_Gotos(wn_loop))
01141 return SNL_Finalizable_Loops(Good_Do_Next_Innermost(wn_loop), dg, du);
01142
01143 INT nest_depth = 0;
01144 WN* wn = 0;
01145 for (wn = wn_loop; wn != NULL; wn = Find_Next_Innermost_Do(wn)) {
01146 nest_depth = Do_Loop_Depth(wn);
01147 WN* wn_first = WN_first(WN_do_body(wn));
01148 for (WN* wnn = wn_first; wnn != NULL; wnn = WN_next(wnn)) {
01149 if (WN_opcode(wnn) == OPC_DO_LOOP)
01150 continue;
01151 if (OPCODE_is_not_executable(WN_opcode(wnn)))
01152 continue;
01153 if (!OPCODE_is_store(WN_opcode(wnn)))
01154 return SNL_Finalizable_Loops(Find_Next_Innermost_Do(wn), dg, du);
01155 if (Has_Scalar_Use_Inside_Loop(wnn, wn_loop, du))
01156 return SNL_Finalizable_Loops(Find_Next_Innermost_Do(wn_loop), dg, du);
01157 if (Has_Array_Dep_Carried_Inside_Loop(wnn, wn_loop, dg))
01158 return SNL_Finalizable_Loops(Find_Next_Innermost_Do(wn_loop), dg, du);
01159 if (Has_Complex_Access_Array(wnn, wn_loop))
01160 return SNL_Finalizable_Loops(Find_Next_Innermost_Do(wn_loop), dg, du);
01161 }
01162 }
01163
01164 BOOL* indexed = CXX_NEW_ARRAY(BOOL, nest_depth + 1, &LNO_local_pool);
01165 INT i;
01166 for (i = 0; i <= nest_depth; i++)
01167 indexed[i] = FALSE;
01168 for (wn = wn_loop; wn != NULL; wn = Find_Next_Innermost_Do(wn)) {
01169 WN* wn_first = WN_first(WN_do_body(wn));
01170 for (WN* wnn = wn_first; wnn != NULL; wnn = WN_next(wnn))
01171 Mark_Indexed_References(wnn, indexed);
01172 }
01173 for (wn = wn_loop; wn != NULL; wn = Find_Next_Innermost_Do(wn)) {
01174 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn);
01175 Set_Indexed_Loop_Bounds(dli->LB, dli->Depth, indexed, FALSE);
01176 Set_Indexed_Loop_Bounds(dli->UB, dli->Depth, indexed, TRUE);
01177 }
01178 Discard_Possibly_Empty_Loops(wn_loop, nest_depth, indexed);
01179
01180 WN* wn_candidate = wn_loop;
01181 for (i = Do_Depth(wn_loop); i <= nest_depth; i++) {
01182 if (!indexed[i])
01183 stack_final->Push(wn_candidate);
01184 wn_candidate = Find_Next_Innermost_Do(wn_candidate);
01185 }
01186 return stack_final;
01187 }
01188
01189
01190
01191
01192
01193
01194
01195 static INT First_Invariant_Depth(WN* wn_loop,
01196 ACCESS_ARRAY* aa)
01197 {
01198 if (Bound_Is_Too_Messy(aa))
01199 return Do_Loop_Depth(wn_loop);
01200 INT depth = aa->Non_Const_Loops();
01201 for (INT i = 0; i < aa->Num_Vec(); i++) {
01202 ACCESS_VECTOR* av = aa->Dim(i);
01203 for (INT j = 0; j < av->Nest_Depth() - 1; j++)
01204 if (av->Loop_Coeff(j) != 0)
01205 depth = j + 1;
01206 }
01207 return depth;
01208 }
01209
01210
01211
01212
01213
01214
01215
01216 extern WN* SNL_Finalize_Loops(WN* wn_outer_loop,
01217 DOLOOP_STACK* stack_final,
01218 ARRAY_DIRECTED_GRAPH16* dg,
01219 DU_MANAGER* du)
01220 {
01221 WN* wn_first = NULL;
01222 WN* wn_last = NULL;
01223 WN* wn_return = wn_outer_loop;
01224 for (INT i = 0; i < stack_final->Elements(); i++) {
01225 WN* wn_loop = stack_final->Bottom_nth(i);
01226 if (LNO_Verbose) {
01227 fprintf(stdout, "Finalizing Loop on line %d\n",
01228 (INT) WN_linenum(wn_loop));
01229 fprintf(TFile, "Finalizing Loop on line %d\n",
01230 (INT) WN_linenum(wn_loop));
01231 }
01232 if (LNO_Tlog)
01233 Generate_Tlog("LNO", "trip_count", Srcpos_To_Line(WN_linenum(wn_loop)),
01234 (char *) WB_Whirl_Symbol(wn_loop), "", "", "finalize-loop");
01235 DO_LOOP_INFO* dli = Get_Do_Loop_Info(wn_loop);
01236 if (!Upper_Bound_Standardize(WN_end(wn_loop), TRUE))
01237 continue;
01238 if (Bound_Is_Too_Messy(dli->LB) || Bound_Is_Too_Messy(dli->UB))
01239 continue;
01240 if (!dli->Step->Is_Const() || dli->Step->Const_Offset != 1)
01241 continue;
01242 if (COND_Do_Info(wn_loop, &LNO_local_pool) != COND_DO_AT_LEAST_ONCE) {
01243 WN* wn_guard = Guard_A_Do(wn_loop);
01244 WN_Reset_If_Guard(wn_guard);
01245 }
01246 wn_return = Find_Next_Innermost_Do(wn_loop);
01247 Replace_Wnexp_With_Exp_Copy(WN_kid0(WN_start(wn_loop)),
01248 UBexp(WN_end(wn_loop)), du);
01249 CXX_DELETE(dli->LB, &LNO_default_pool);
01250 dli->LB = CXX_NEW(ACCESS_ARRAY(dli->UB, &LNO_default_pool),
01251 &LNO_default_pool);
01252 for (INT j = 0; j < dli->LB->Num_Vec(); j++)
01253 dli->LB->Dim(j)->Negate_Me();
01254 Remove_Unity_Trip_Loop(wn_loop, TRUE, &wn_first, &wn_last, dg, du);
01255 }
01256 return wn_return;
01257 }
01258
01259
01260
01261
01262
01263
01264
01265 extern void Finalize_Loops(WN* func_nd)
01266 {
01267 if (!LNO_Loop_Finalization)
01268 return;
01269
01270 ARRAY_DIRECTED_GRAPH16* dg = Array_Dependence_Graph;
01271 DU_MANAGER* du = Du_Mgr;
01272
01273 FIZ_FUSE_INFO* ffi=
01274 CXX_NEW(FIZ_FUSE_INFO(&LNO_local_pool), &LNO_local_pool);
01275 ffi->Build(func_nd);
01276
01277 for (INT i = 0; i < ffi->Num_Snl(); i++) {
01278 WN* wn = ffi->Get_Wn(i);
01279 if (ffi->Get_Type(i) != Inner)
01280 continue;
01281 DOLOOP_STACK* final_stack = SNL_Finalizable_Loops(wn, dg, du);
01282 SNL_Finalize_Loops(wn, final_stack, dg, du);
01283 CXX_DELETE(final_stack, &LNO_default_pool);
01284 }
01285 }
01286
01287
01288 static void
01289 Update_Def_List_Loop_Stmt(WN* old_loop, WN* new_loop)
01290 {
01291 LWN_ITER* itr = LWN_WALK_TreeIter(WN_do_body(old_loop));
01292 for (; itr; itr = LWN_WALK_TreeNext(itr)) {
01293 WN* wn = itr->wn;
01294 DEF_LIST *def_list = Du_Mgr->Ud_Get_Def(wn);
01295 if (def_list) {
01296 if (def_list->Loop_stmt() == old_loop) {
01297 def_list->Set_loop_stmt(new_loop);
01298 }
01299 }
01300 }
01301 }
01302
01303
01304
01305
01306
01307
01308
01309 extern void
01310 Unroll_Loop_By_Trip_Count(WN* outerloop, INT u)
01311 {
01312 INT i;
01313
01314
01315
01316
01317
01318
01319 SYMBOL indexsym(WN_index(outerloop));
01320 indexsym.Type = Do_Wtype(outerloop);
01321
01322 INT depth = Do_Loop_Depth(outerloop);
01323
01324
01325 INT64 ostep = Step_Size(outerloop);
01326 ostep = Step_Size(outerloop, u*ostep);
01327
01328
01329 WN** unroll_body = CXX_NEW_ARRAY(WN*, u, &LNO_local_pool);
01330
01331 unroll_body[0] = outerloop;
01332 LWN_Scale_Frequency(WN_end(outerloop), 1.0/u);
01333 LWN_Scale_Frequency(WN_step(outerloop), 1.0/u);
01334 for (i = 1; i < u; i++) {
01335 unroll_body[i] = LWN_Copy_Tree(outerloop, TRUE, LNO_Info_Map);
01336 LWN_Scale_Frequency_Tree(unroll_body[i], 1.0/u);
01337 }
01338
01339 Unrolled_DU_Update(unroll_body, u, depth, TRUE, TRUE);
01340
01341
01342 for (i = 1; i < u; i++) {
01343 Add_To_Symbol(unroll_body[i], i*ostep, indexsym, TRUE);
01344 }
01345
01346 for (i = 1; i < u; i++) {
01347 Update_Def_List_Loop_Stmt(unroll_body[i], outerloop);
01348
01349
01350 LWN_Update_Def_Use_Delete_Tree(WN_start(unroll_body[i]));
01351 LWN_Update_Def_Use_Delete_Tree(WN_end(unroll_body[i]));
01352 LWN_Update_Def_Use_Delete_Tree(WN_step(unroll_body[i]));
01353 }
01354
01355 for (i = 1; i < u; i++) {
01356 LWN_Insert_Block_After(WN_do_body(outerloop),
01357 WN_last(WN_do_body(outerloop)),
01358 WN_do_body(unroll_body[i]));
01359 }
01360 }