1 //===-- SIAnnotateControlFlow.cpp -  ------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 /// \file
11 /// Annotates the control flow with hardware specific intrinsics.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "AMDGPU.h"
16 #include "llvm/ADT/DepthFirstIterator.h"
17 #include "llvm/Analysis/DivergenceAnalysis.h"
18 #include "llvm/Analysis/LoopInfo.h"
19 #include "llvm/IR/Constants.h"
20 #include "llvm/IR/Dominators.h"
21 #include "llvm/IR/Instructions.h"
22 #include "llvm/IR/Module.h"
23 #include "llvm/Pass.h"
24 #include "llvm/Transforms/Utils/BasicBlockUtils.h"
25 #include "llvm/Transforms/Utils/SSAUpdater.h"
26 
27 using namespace llvm;
28 
29 #define DEBUG_TYPE "si-annotate-control-flow"
30 
31 namespace {
32 
33 // Complex types used in this pass
34 typedef std::pair<BasicBlock *, Value *> StackEntry;
35 typedef SmallVector<StackEntry, 16> StackVector;
36 
37 // Intrinsic names the control flow is annotated with
38 static const char *const IfIntrinsic = "llvm.amdgcn.if";
39 static const char *const ElseIntrinsic = "llvm.amdgcn.else";
40 static const char *const BreakIntrinsic = "llvm.amdgcn.break";
41 static const char *const IfBreakIntrinsic = "llvm.amdgcn.if.break";
42 static const char *const ElseBreakIntrinsic = "llvm.amdgcn.else.break";
43 static const char *const LoopIntrinsic = "llvm.amdgcn.loop";
44 static const char *const EndCfIntrinsic = "llvm.amdgcn.end.cf";
45 
46 class SIAnnotateControlFlow : public FunctionPass {
47   DivergenceAnalysis *DA;
48 
49   Type *Boolean;
50   Type *Void;
51   Type *Int64;
52   Type *ReturnStruct;
53 
54   ConstantInt *BoolTrue;
55   ConstantInt *BoolFalse;
56   UndefValue *BoolUndef;
57   Constant *Int64Zero;
58 
59   Constant *If;
60   Constant *Else;
61   Constant *Break;
62   Constant *IfBreak;
63   Constant *ElseBreak;
64   Constant *Loop;
65   Constant *EndCf;
66 
67   DominatorTree *DT;
68   StackVector Stack;
69 
70   LoopInfo *LI;
71 
72   bool isUniform(BranchInst *T);
73 
74   bool isTopOfStack(BasicBlock *BB);
75 
76   Value *popSaved();
77 
78   void push(BasicBlock *BB, Value *Saved);
79 
80   bool isElse(PHINode *Phi);
81 
82   void eraseIfUnused(PHINode *Phi);
83 
84   void openIf(BranchInst *Term);
85 
86   void insertElse(BranchInst *Term);
87 
88   Value *handleLoopCondition(Value *Cond, PHINode *Broken,
89                              llvm::Loop *L, BranchInst *Term);
90 
91   void handleLoop(BranchInst *Term);
92 
93   void closeControlFlow(BasicBlock *BB);
94 
95 public:
96   static char ID;
97 
SIAnnotateControlFlow()98   SIAnnotateControlFlow():
99     FunctionPass(ID) { }
100 
101   bool doInitialization(Module &M) override;
102 
103   bool runOnFunction(Function &F) override;
104 
getPassName() const105   const char *getPassName() const override {
106     return "SI annotate control flow";
107   }
108 
getAnalysisUsage(AnalysisUsage & AU) const109   void getAnalysisUsage(AnalysisUsage &AU) const override {
110     AU.addRequired<LoopInfoWrapperPass>();
111     AU.addRequired<DominatorTreeWrapperPass>();
112     AU.addRequired<DivergenceAnalysis>();
113     AU.addPreserved<DominatorTreeWrapperPass>();
114     FunctionPass::getAnalysisUsage(AU);
115   }
116 
117 };
118 
119 } // end anonymous namespace
120 
121 INITIALIZE_PASS_BEGIN(SIAnnotateControlFlow, DEBUG_TYPE,
122                       "Annotate SI Control Flow", false, false)
123 INITIALIZE_PASS_DEPENDENCY(DivergenceAnalysis)
124 INITIALIZE_PASS_END(SIAnnotateControlFlow, DEBUG_TYPE,
125                     "Annotate SI Control Flow", false, false)
126 
127 char SIAnnotateControlFlow::ID = 0;
128 
129 /// \brief Initialize all the types and constants used in the pass
doInitialization(Module & M)130 bool SIAnnotateControlFlow::doInitialization(Module &M) {
131   LLVMContext &Context = M.getContext();
132 
133   Void = Type::getVoidTy(Context);
134   Boolean = Type::getInt1Ty(Context);
135   Int64 = Type::getInt64Ty(Context);
136   ReturnStruct = StructType::get(Boolean, Int64, (Type *)nullptr);
137 
138   BoolTrue = ConstantInt::getTrue(Context);
139   BoolFalse = ConstantInt::getFalse(Context);
140   BoolUndef = UndefValue::get(Boolean);
141   Int64Zero = ConstantInt::get(Int64, 0);
142 
143   If = M.getOrInsertFunction(
144     IfIntrinsic, ReturnStruct, Boolean, (Type *)nullptr);
145 
146   Else = M.getOrInsertFunction(
147     ElseIntrinsic, ReturnStruct, Int64, (Type *)nullptr);
148 
149   Break = M.getOrInsertFunction(
150     BreakIntrinsic, Int64, Int64, (Type *)nullptr);
151 
152   IfBreak = M.getOrInsertFunction(
153     IfBreakIntrinsic, Int64, Boolean, Int64, (Type *)nullptr);
154 
155   ElseBreak = M.getOrInsertFunction(
156     ElseBreakIntrinsic, Int64, Int64, Int64, (Type *)nullptr);
157 
158   Loop = M.getOrInsertFunction(
159     LoopIntrinsic, Boolean, Int64, (Type *)nullptr);
160 
161   EndCf = M.getOrInsertFunction(
162     EndCfIntrinsic, Void, Int64, (Type *)nullptr);
163 
164   return false;
165 }
166 
167 /// \brief Is the branch condition uniform or did the StructurizeCFG pass
168 /// consider it as such?
isUniform(BranchInst * T)169 bool SIAnnotateControlFlow::isUniform(BranchInst *T) {
170   return DA->isUniform(T->getCondition()) ||
171          T->getMetadata("structurizecfg.uniform") != nullptr;
172 }
173 
174 /// \brief Is BB the last block saved on the stack ?
isTopOfStack(BasicBlock * BB)175 bool SIAnnotateControlFlow::isTopOfStack(BasicBlock *BB) {
176   return !Stack.empty() && Stack.back().first == BB;
177 }
178 
179 /// \brief Pop the last saved value from the control flow stack
popSaved()180 Value *SIAnnotateControlFlow::popSaved() {
181   return Stack.pop_back_val().second;
182 }
183 
184 /// \brief Push a BB and saved value to the control flow stack
push(BasicBlock * BB,Value * Saved)185 void SIAnnotateControlFlow::push(BasicBlock *BB, Value *Saved) {
186   Stack.push_back(std::make_pair(BB, Saved));
187 }
188 
189 /// \brief Can the condition represented by this PHI node treated like
190 /// an "Else" block?
isElse(PHINode * Phi)191 bool SIAnnotateControlFlow::isElse(PHINode *Phi) {
192   BasicBlock *IDom = DT->getNode(Phi->getParent())->getIDom()->getBlock();
193   for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) {
194     if (Phi->getIncomingBlock(i) == IDom) {
195 
196       if (Phi->getIncomingValue(i) != BoolTrue)
197         return false;
198 
199     } else {
200       if (Phi->getIncomingValue(i) != BoolFalse)
201         return false;
202 
203     }
204   }
205   return true;
206 }
207 
208 // \brief Erase "Phi" if it is not used any more
eraseIfUnused(PHINode * Phi)209 void SIAnnotateControlFlow::eraseIfUnused(PHINode *Phi) {
210   if (!Phi->hasNUsesOrMore(1))
211     Phi->eraseFromParent();
212 }
213 
214 /// \brief Open a new "If" block
openIf(BranchInst * Term)215 void SIAnnotateControlFlow::openIf(BranchInst *Term) {
216   if (isUniform(Term)) {
217     return;
218   }
219   Value *Ret = CallInst::Create(If, Term->getCondition(), "", Term);
220   Term->setCondition(ExtractValueInst::Create(Ret, 0, "", Term));
221   push(Term->getSuccessor(1), ExtractValueInst::Create(Ret, 1, "", Term));
222 }
223 
224 /// \brief Close the last "If" block and open a new "Else" block
insertElse(BranchInst * Term)225 void SIAnnotateControlFlow::insertElse(BranchInst *Term) {
226   if (isUniform(Term)) {
227     return;
228   }
229   Value *Ret = CallInst::Create(Else, popSaved(), "", Term);
230   Term->setCondition(ExtractValueInst::Create(Ret, 0, "", Term));
231   push(Term->getSuccessor(1), ExtractValueInst::Create(Ret, 1, "", Term));
232 }
233 
234 /// \brief Recursively handle the condition leading to a loop
handleLoopCondition(Value * Cond,PHINode * Broken,llvm::Loop * L,BranchInst * Term)235 Value *SIAnnotateControlFlow::handleLoopCondition(Value *Cond, PHINode *Broken,
236                                              llvm::Loop *L, BranchInst *Term) {
237 
238   // Only search through PHI nodes which are inside the loop.  If we try this
239   // with PHI nodes that are outside of the loop, we end up inserting new PHI
240   // nodes outside of the loop which depend on values defined inside the loop.
241   // This will break the module with
242   // 'Instruction does not dominate all users!' errors.
243   PHINode *Phi = nullptr;
244   if ((Phi = dyn_cast<PHINode>(Cond)) && L->contains(Phi)) {
245 
246     BasicBlock *Parent = Phi->getParent();
247     PHINode *NewPhi = PHINode::Create(Int64, 0, "", &Parent->front());
248     Value *Ret = NewPhi;
249 
250     // Handle all non-constant incoming values first
251     for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) {
252       Value *Incoming = Phi->getIncomingValue(i);
253       BasicBlock *From = Phi->getIncomingBlock(i);
254       if (isa<ConstantInt>(Incoming)) {
255         NewPhi->addIncoming(Broken, From);
256         continue;
257       }
258 
259       Phi->setIncomingValue(i, BoolFalse);
260       Value *PhiArg = handleLoopCondition(Incoming, Broken, L, Term);
261       NewPhi->addIncoming(PhiArg, From);
262     }
263 
264     BasicBlock *IDom = DT->getNode(Parent)->getIDom()->getBlock();
265 
266     for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) {
267 
268       Value *Incoming = Phi->getIncomingValue(i);
269       if (Incoming != BoolTrue)
270         continue;
271 
272       BasicBlock *From = Phi->getIncomingBlock(i);
273       if (From == IDom) {
274         // We're in the following situation:
275         //   IDom/From
276         //      |   \
277         //      |   If-block
278         //      |   /
279         //     Parent
280         // where we want to break out of the loop if the If-block is not taken.
281         // Due to the depth-first traversal, there should be an end.cf
282         // intrinsic in Parent, and we insert an else.break before it.
283         //
284         // Note that the end.cf need not be the first non-phi instruction
285         // of parent, particularly when we're dealing with a multi-level
286         // break, but it should occur within a group of intrinsic calls
287         // at the beginning of the block.
288         CallInst *OldEnd = dyn_cast<CallInst>(Parent->getFirstInsertionPt());
289         while (OldEnd && OldEnd->getCalledFunction() != EndCf)
290           OldEnd = dyn_cast<CallInst>(OldEnd->getNextNode());
291         if (OldEnd && OldEnd->getCalledFunction() == EndCf) {
292           Value *Args[] = { OldEnd->getArgOperand(0), NewPhi };
293           Ret = CallInst::Create(ElseBreak, Args, "", OldEnd);
294           continue;
295         }
296       }
297       TerminatorInst *Insert = From->getTerminator();
298       Value *PhiArg = CallInst::Create(Break, Broken, "", Insert);
299       NewPhi->setIncomingValue(i, PhiArg);
300     }
301     eraseIfUnused(Phi);
302     return Ret;
303 
304   } else if (Instruction *Inst = dyn_cast<Instruction>(Cond)) {
305     BasicBlock *Parent = Inst->getParent();
306     Instruction *Insert;
307     if (L->contains(Inst)) {
308       Insert = Parent->getTerminator();
309     } else {
310       Insert = L->getHeader()->getFirstNonPHIOrDbgOrLifetime();
311     }
312     Value *Args[] = { Cond, Broken };
313     return CallInst::Create(IfBreak, Args, "", Insert);
314 
315   // Insert IfBreak before TERM for constant COND.
316   } else if (isa<ConstantInt>(Cond)) {
317     Value *Args[] = { Cond, Broken };
318     return CallInst::Create(IfBreak, Args, "", Term);
319 
320   } else {
321     llvm_unreachable("Unhandled loop condition!");
322   }
323   return nullptr;
324 }
325 
326 /// \brief Handle a back edge (loop)
handleLoop(BranchInst * Term)327 void SIAnnotateControlFlow::handleLoop(BranchInst *Term) {
328   if (isUniform(Term)) {
329     return;
330   }
331 
332   BasicBlock *BB = Term->getParent();
333   llvm::Loop *L = LI->getLoopFor(BB);
334   BasicBlock *Target = Term->getSuccessor(1);
335   PHINode *Broken = PHINode::Create(Int64, 0, "", &Target->front());
336 
337   Value *Cond = Term->getCondition();
338   Term->setCondition(BoolTrue);
339   Value *Arg = handleLoopCondition(Cond, Broken, L, Term);
340 
341   for (pred_iterator PI = pred_begin(Target), PE = pred_end(Target);
342        PI != PE; ++PI) {
343 
344     Broken->addIncoming(*PI == BB ? Arg : Int64Zero, *PI);
345   }
346 
347   Term->setCondition(CallInst::Create(Loop, Arg, "", Term));
348   push(Term->getSuccessor(0), Arg);
349 }/// \brief Close the last opened control flow
closeControlFlow(BasicBlock * BB)350 void SIAnnotateControlFlow::closeControlFlow(BasicBlock *BB) {
351   llvm::Loop *L = LI->getLoopFor(BB);
352 
353   assert(Stack.back().first == BB);
354 
355   if (L && L->getHeader() == BB) {
356     // We can't insert an EndCF call into a loop header, because it will
357     // get executed on every iteration of the loop, when it should be
358     // executed only once before the loop.
359     SmallVector <BasicBlock*, 8> Latches;
360     L->getLoopLatches(Latches);
361 
362     std::vector<BasicBlock*> Preds;
363     for (pred_iterator PI = pred_begin(BB), PE = pred_end(BB); PI != PE; ++PI) {
364       if (std::find(Latches.begin(), Latches.end(), *PI) == Latches.end())
365         Preds.push_back(*PI);
366     }
367     BB = llvm::SplitBlockPredecessors(BB, Preds, "endcf.split", DT, LI, false);
368   }
369 
370   Value *Exec = popSaved();
371   if (!isa<UndefValue>(Exec))
372     CallInst::Create(EndCf, Exec, "", &*BB->getFirstInsertionPt());
373 }
374 
375 /// \brief Annotate the control flow with intrinsics so the backend can
376 /// recognize if/then/else and loops.
runOnFunction(Function & F)377 bool SIAnnotateControlFlow::runOnFunction(Function &F) {
378 
379   DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
380   LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
381   DA = &getAnalysis<DivergenceAnalysis>();
382 
383   for (df_iterator<BasicBlock *> I = df_begin(&F.getEntryBlock()),
384        E = df_end(&F.getEntryBlock()); I != E; ++I) {
385 
386     BranchInst *Term = dyn_cast<BranchInst>((*I)->getTerminator());
387 
388     if (!Term || Term->isUnconditional()) {
389       if (isTopOfStack(*I))
390         closeControlFlow(*I);
391 
392       continue;
393     }
394 
395     if (I.nodeVisited(Term->getSuccessor(1))) {
396       if (isTopOfStack(*I))
397         closeControlFlow(*I);
398 
399       handleLoop(Term);
400       continue;
401     }
402 
403     if (isTopOfStack(*I)) {
404       PHINode *Phi = dyn_cast<PHINode>(Term->getCondition());
405       if (Phi && Phi->getParent() == *I && isElse(Phi)) {
406         insertElse(Term);
407         eraseIfUnused(Phi);
408         continue;
409       }
410       closeControlFlow(*I);
411     }
412     openIf(Term);
413   }
414 
415   assert(Stack.empty());
416   return true;
417 }
418 
419 /// \brief Create the annotation pass
createSIAnnotateControlFlowPass()420 FunctionPass *llvm::createSIAnnotateControlFlowPass() {
421   return new SIAnnotateControlFlow();
422 }
423