-
Notifications
You must be signed in to change notification settings - Fork 12.1k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Loop transformations can sometimes fail because the loop, while in valid rotated LCSSA form, is not in a canonical CFG form. This is an extremely simple pass that just merges obviously redundant blocks, which can be used to fix some known failure cases. In the future, it may be enhanced with more cases (and have code shared with SimplifyCFG). This allows us to run LoopSimplifyCFG -> LoopRotate -> LoopUnroll, so that SimplifyCFG cleans up the loop before Rotate tries to run. Not currently used in the pass manager, since this pass doesn't do anything unless you can hook it up in an LPM with other loop passes. It'll be added once Chandler cleans up things to allow this. Tested in a custom pipeline out of tree to confirm it works in practice (in addition to the included trivial test). llvm-svn: 259256
- Loading branch information
Fiona Glaser
committed
Jan 29, 2016
1 parent
9c98105
commit b417d46
Showing
7 changed files
with
160 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,111 @@ | ||
//===--------- LoopSimplifyCFG.cpp - Loop CFG Simplification Pass ---------===// | ||
// | ||
// The LLVM Compiler Infrastructure | ||
// | ||
// This file is distributed under the University of Illinois Open Source | ||
// License. See LICENSE.TXT for details. | ||
// | ||
//===----------------------------------------------------------------------===// | ||
// | ||
// This file implements the Loop SimplifyCFG Pass. This pass is responsible for | ||
// basic loop CFG cleanup, primarily to assist other loop passes. If you | ||
// encounter a noncanonical CFG construct that causes another loop pass to | ||
// perform suboptimally, this is the place to fix it up. | ||
// | ||
//===----------------------------------------------------------------------===// | ||
|
||
#include "llvm/Transforms/Scalar.h" | ||
#include "llvm/ADT/SmallVector.h" | ||
#include "llvm/ADT/Statistic.h" | ||
#include "llvm/Analysis/AliasAnalysis.h" | ||
#include "llvm/Analysis/BasicAliasAnalysis.h" | ||
#include "llvm/Analysis/AssumptionCache.h" | ||
#include "llvm/Analysis/DependenceAnalysis.h" | ||
#include "llvm/Analysis/GlobalsModRef.h" | ||
#include "llvm/Analysis/LoopInfo.h" | ||
#include "llvm/Analysis/LoopPass.h" | ||
#include "llvm/Analysis/ScalarEvolution.h" | ||
#include "llvm/Analysis/ScalarEvolutionAliasAnalysis.h" | ||
#include "llvm/Analysis/TargetTransformInfo.h" | ||
#include "llvm/IR/Dominators.h" | ||
#include "llvm/Transforms/Utils/Local.h" | ||
using namespace llvm; | ||
|
||
#define DEBUG_TYPE "loop-simplifycfg" | ||
|
||
namespace { | ||
class LoopSimplifyCFG : public LoopPass { | ||
public: | ||
static char ID; // Pass ID, replacement for typeid | ||
LoopSimplifyCFG() : LoopPass(ID) { | ||
initializeLoopSimplifyCFGPass(*PassRegistry::getPassRegistry()); | ||
} | ||
|
||
bool runOnLoop(Loop *L, LPPassManager &) override; | ||
|
||
void getAnalysisUsage(AnalysisUsage &AU) const override { | ||
AU.addRequired<DominatorTreeWrapperPass>(); | ||
AU.addRequired<LoopInfoWrapperPass>(); | ||
|
||
AU.addPreserved<DominatorTreeWrapperPass>(); | ||
AU.addPreserved<LoopInfoWrapperPass>(); | ||
AU.addPreserved<GlobalsAAWrapperPass>(); | ||
AU.addPreserved<BasicAAWrapperPass>(); | ||
AU.addPreserved<AAResultsWrapperPass>(); | ||
AU.addPreserved<ScalarEvolutionWrapperPass>(); | ||
AU.addPreserved<SCEVAAWrapperPass>(); | ||
AU.addPreserved<DependenceAnalysis>(); | ||
AU.addPreservedID(LoopSimplifyID); | ||
AU.addPreservedID(LCSSAID); | ||
} | ||
}; | ||
} | ||
|
||
char LoopSimplifyCFG::ID = 0; | ||
INITIALIZE_PASS_BEGIN(LoopSimplifyCFG, "loop-simplifycfg", "Simplify loop CFG", | ||
false, false) | ||
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) | ||
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass) | ||
INITIALIZE_PASS_END(LoopSimplifyCFG, "loop-simplifycfg", "Simplify loop CFG", | ||
false, false) | ||
|
||
/// Factory for the loop CFG simplification pass. Returns a newly allocated
/// LoopSimplifyCFG instance as a generic Pass pointer.
Pass *llvm::createLoopSimplifyCFGPass() {
  return new LoopSimplifyCFG();
}
|
||
/// Merge trivially redundant blocks of \p L into their unique predecessor.
///
/// A block is merged when it has exactly one predecessor, that predecessor
/// has exactly one successor, and \p LI maps the predecessor to \p L itself
/// (so blocks owned by other loops are left alone).
///
/// \param L  The loop whose blocks are examined.
/// \param DT Dominator tree, forwarded to MergeBasicBlockIntoOnlyPred.
/// \param LI Loop info; the predecessor is removed from it before the merge.
/// \returns true if at least one merge was performed.
static bool simplifyLoopCFG(Loop *L, DominatorTree *DT, LoopInfo *LI) {
  bool Changed = false;
  // Copy blocks into a temporary array of weak handles to avoid iterator
  // invalidation issues as we remove them.
  SmallVector<WeakVH, 16> Blocks(L->blocks());

  for (auto &Block : Blocks) {
    // A handle may no longer refer to a block if that block was merged away
    // by an earlier iteration. Use cast_or_null so such entries are skipped:
    // plain cast<> asserts on a null value, which would make the check below
    // ineffective.
    BasicBlock *Succ = cast_or_null<BasicBlock>(Block);
    if (!Succ)
      continue;

    // Attempt to merge blocks in the trivial case. Don't modify blocks which
    // belong to other loops.
    BasicBlock *Pred = Succ->getSinglePredecessor();
    if (!Pred || !Pred->getSingleSuccessor() || LI->getLoopFor(Pred) != L)
      continue;

    // Pred is going to disappear, so we need to update the loop info. If it
    // was the header, Succ takes over that role first.
    if (L->getHeader() == Pred)
      L->moveToHeader(Succ);
    LI->removeBlock(Pred);
    MergeBasicBlockIntoOnlyPred(Succ, DT);
    Changed = true;
  }

  return Changed;
}
|
||
/// Entry point invoked for each loop: performs basic CFG simplifications to
/// assist other loop passes. Currently the only simplification is merging
/// blocks in the trivial single-predecessor / single-successor case.
///
/// Returns true if the loop's CFG was modified, false otherwise (including
/// when skipOptnoneFunction asks for the loop to be skipped).
bool LoopSimplifyCFG::runOnLoop(Loop *L, LPPassManager &) {
  const bool ShouldSkip = skipOptnoneFunction(L);
  if (ShouldSkip) {
    return false;
  }

  // Fetch the analyses requested in getAnalysisUsage and hand them to the
  // worker routine.
  auto &DomTree = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
  auto &Loops = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
  const bool Modified = simplifyLoopCFG(L, &DomTree, &Loops);
  return Modified;
}
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,34 @@ | ||
; RUN: opt -S -loop-simplifycfg < %s | FileCheck %s | ||
|
||
; CHECK-LABEL: foo | ||
; CHECK: entry: | ||
; CHECK-NEXT: br label %[[LOOP:[a-z]+]] | ||
; CHECK: [[LOOP]]: | ||
; CHECK-NEXT: phi | ||
; CHECK-NOT: br label | ||
; CHECK: br i1 | ||
; @foo contains one loop made of three blocks: %outer (entered from %entry),
; %inner and %outer.latch2 (which branches back to %outer). The FileCheck
; directives above expect the block reached from %entry to start with the phi
; and to contain no unconditional branch before its conditional branch.
define i32 @foo(i32* %P, i64* %Q) { | ||
entry: | ||
br label %outer | ||
|
||
; %outer only holds the induction phi and an unconditional branch to %inner.
outer: ; preds = %outer.latch2, %entry | ||
%y.2 = phi i32 [ 0, %entry ], [ %y.inc2, %outer.latch2 ] | ||
br label %inner | ||
|
||
; %inner has %outer as its only predecessor, and %outer has %inner as its only
; successor, so this pair matches the trivial merge case handled by the pass.
inner: ; preds = %outer | ||
store i32 0, i32* %P | ||
store i32 1, i32* %P | ||
store i32 2, i32* %P | ||
%y.inc2 = add nsw i32 %y.2, 1 | ||
; The loop exits once the incremented counter equals 3.
%exitcond.outer = icmp eq i32 %y.inc2, 3 | ||
store i32 %y.2, i32* %P | ||
br i1 %exitcond.outer, label %exit, label %outer.latch2 | ||
|
||
; %outer.latch2's predecessor %inner has two successors, so this block does
; not match the trivial merge case.
outer.latch2: ; preds = %inner | ||
%t = sext i32 %y.inc2 to i64 | ||
store i64 %t, i64* %Q | ||
br label %outer | ||
|
||
exit: ; preds = %inner | ||
ret i32 0 | ||
} |