1 //===- llvm/Analysis/LoopInfo.h - Natural Loop Calculator -------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines the LoopInfo class that is used to identify natural loops
11 // and determine the loop depth of various nodes of the CFG.  A natural loop
12 // has exactly one entry-point, which is called the header. Note that natural
13 // loops may actually be several loops that share the same header node.
14 //
15 // This analysis calculates the nesting structure of loops in a function.  For
16 // each natural loop identified, this analysis identifies natural loops
17 // contained entirely within the loop and the basic blocks the make up the loop.
18 //
19 // It can calculate on the fly various bits of information, for example:
20 //
21 //  * whether there is a preheader for the loop
22 //  * the number of back edges to the header
23 //  * whether or not a particular block branches out of the loop
24 //  * the successor blocks of the loop
25 //  * the loop depth
26 //  * etc...
27 //
28 // Note that this analysis specifically identifies *Loops* not cycles or SCCs
29 // in the CFG.  There can be strongly connected components in the CFG which
30 // this analysis will not recognize and that will not be represented by a Loop
31 // instance.  In particular, a Loop might be inside such a non-loop SCC, or a
32 // non-loop SCC might contain a sub-SCC which is a Loop.
33 //
34 //===----------------------------------------------------------------------===//
35 
36 #ifndef LLVM_ANALYSIS_LOOPINFO_H
37 #define LLVM_ANALYSIS_LOOPINFO_H
38 
39 #include "llvm/ADT/DenseMap.h"
40 #include "llvm/ADT/DenseSet.h"
41 #include "llvm/ADT/GraphTraits.h"
42 #include "llvm/ADT/SmallPtrSet.h"
43 #include "llvm/ADT/SmallVector.h"
44 #include "llvm/IR/CFG.h"
45 #include "llvm/IR/Instruction.h"
46 #include "llvm/IR/Instructions.h"
47 #include "llvm/IR/PassManager.h"
48 #include "llvm/Pass.h"
49 #include "llvm/Support/Allocator.h"
50 #include <algorithm>
51 #include <utility>
52 
53 namespace llvm {
54 
55 class DominatorTree;
56 class LoopInfo;
57 class Loop;
58 class MDNode;
59 class PHINode;
60 class raw_ostream;
61 template <class N, bool IsPostDom> class DominatorTreeBase;
62 template <class N, class M> class LoopInfoBase;
63 template <class N, class M> class LoopBase;
64 
65 //===----------------------------------------------------------------------===//
66 /// Instances of this class are used to represent loops that are detected in the
67 /// flow graph.
68 ///
69 template <class BlockT, class LoopT> class LoopBase {
70   LoopT *ParentLoop;
71   // Loops contained entirely within this one.
72   std::vector<LoopT *> SubLoops;
73 
74   // The list of blocks in this loop. First entry is the header node.
75   std::vector<BlockT *> Blocks;
76 
77   SmallPtrSet<const BlockT *, 8> DenseBlockSet;
78 
79 #if LLVM_ENABLE_ABI_BREAKING_CHECKS
80   /// Indicator that this loop is no longer a valid loop.
81   bool IsInvalid = false;
82 #endif
83 
84   LoopBase(const LoopBase<BlockT, LoopT> &) = delete;
85   const LoopBase<BlockT, LoopT> &
86   operator=(const LoopBase<BlockT, LoopT> &) = delete;
87 
88 public:
89   /// Return the nesting level of this loop.  An outer-most loop has depth 1,
90   /// for consistency with loop depth values used for basic blocks, where depth
91   /// 0 is used for blocks not inside any loops.
getLoopDepth()92   unsigned getLoopDepth() const {
93     assert(!isInvalid() && "Loop not in a valid state!");
94     unsigned D = 1;
95     for (const LoopT *CurLoop = ParentLoop; CurLoop;
96          CurLoop = CurLoop->ParentLoop)
97       ++D;
98     return D;
99   }
getHeader()100   BlockT *getHeader() const { return getBlocks().front(); }
getParentLoop()101   LoopT *getParentLoop() const { return ParentLoop; }
102 
103   /// This is a raw interface for bypassing addChildLoop.
setParentLoop(LoopT * L)104   void setParentLoop(LoopT *L) {
105     assert(!isInvalid() && "Loop not in a valid state!");
106     ParentLoop = L;
107   }
108 
109   /// Return true if the specified loop is contained within in this loop.
contains(const LoopT * L)110   bool contains(const LoopT *L) const {
111     assert(!isInvalid() && "Loop not in a valid state!");
112     if (L == this)
113       return true;
114     if (!L)
115       return false;
116     return contains(L->getParentLoop());
117   }
118 
119   /// Return true if the specified basic block is in this loop.
contains(const BlockT * BB)120   bool contains(const BlockT *BB) const {
121     assert(!isInvalid() && "Loop not in a valid state!");
122     return DenseBlockSet.count(BB);
123   }
124 
125   /// Return true if the specified instruction is in this loop.
contains(const InstT * Inst)126   template <class InstT> bool contains(const InstT *Inst) const {
127     return contains(Inst->getParent());
128   }
129 
130   /// Return the loops contained entirely within this loop.
getSubLoops()131   const std::vector<LoopT *> &getSubLoops() const {
132     assert(!isInvalid() && "Loop not in a valid state!");
133     return SubLoops;
134   }
getSubLoopsVector()135   std::vector<LoopT *> &getSubLoopsVector() {
136     assert(!isInvalid() && "Loop not in a valid state!");
137     return SubLoops;
138   }
139   typedef typename std::vector<LoopT *>::const_iterator iterator;
140   typedef
141       typename std::vector<LoopT *>::const_reverse_iterator reverse_iterator;
begin()142   iterator begin() const { return getSubLoops().begin(); }
end()143   iterator end() const { return getSubLoops().end(); }
rbegin()144   reverse_iterator rbegin() const { return getSubLoops().rbegin(); }
rend()145   reverse_iterator rend() const { return getSubLoops().rend(); }
empty()146   bool empty() const { return getSubLoops().empty(); }
147 
148   /// Get a list of the basic blocks which make up this loop.
getBlocks()149   ArrayRef<BlockT *> getBlocks() const {
150     assert(!isInvalid() && "Loop not in a valid state!");
151     return Blocks;
152   }
153   typedef typename ArrayRef<BlockT *>::const_iterator block_iterator;
block_begin()154   block_iterator block_begin() const { return getBlocks().begin(); }
block_end()155   block_iterator block_end() const { return getBlocks().end(); }
blocks()156   inline iterator_range<block_iterator> blocks() const {
157     assert(!isInvalid() && "Loop not in a valid state!");
158     return make_range(block_begin(), block_end());
159   }
160 
161   /// Get the number of blocks in this loop in constant time.
162   /// Invalidate the loop, indicating that it is no longer a loop.
getNumBlocks()163   unsigned getNumBlocks() const {
164     assert(!isInvalid() && "Loop not in a valid state!");
165     return Blocks.size();
166   }
167 
168   /// Return a direct, mutable handle to the blocks vector so that we can
169   /// mutate it efficiently with techniques like `std::remove`.
getBlocksVector()170   std::vector<BlockT *> &getBlocksVector() {
171     assert(!isInvalid() && "Loop not in a valid state!");
172     return Blocks;
173   }
174   /// Return a direct, mutable handle to the blocks set so that we can
175   /// mutate it efficiently.
getBlocksSet()176   SmallPtrSetImpl<const BlockT *> &getBlocksSet() {
177     assert(!isInvalid() && "Loop not in a valid state!");
178     return DenseBlockSet;
179   }
180 
181   /// Return a direct, immutable handle to the blocks set.
getBlocksSet()182   const SmallPtrSetImpl<const BlockT *> &getBlocksSet() const {
183     assert(!isInvalid() && "Loop not in a valid state!");
184     return DenseBlockSet;
185   }
186 
187   /// Return true if this loop is no longer valid.  The only valid use of this
188   /// helper is "assert(L.isInvalid())" or equivalent, since IsInvalid is set to
189   /// true by the destructor.  In other words, if this accessor returns true,
190   /// the caller has already triggered UB by calling this accessor; and so it
191   /// can only be called in a context where a return value of true indicates a
192   /// programmer error.
isInvalid()193   bool isInvalid() const {
194 #if LLVM_ENABLE_ABI_BREAKING_CHECKS
195     return IsInvalid;
196 #else
197     return false;
198 #endif
199   }
200 
201   /// True if terminator in the block can branch to another block that is
202   /// outside of the current loop.
isLoopExiting(const BlockT * BB)203   bool isLoopExiting(const BlockT *BB) const {
204     assert(!isInvalid() && "Loop not in a valid state!");
205     for (const auto &Succ : children<const BlockT *>(BB)) {
206       if (!contains(Succ))
207         return true;
208     }
209     return false;
210   }
211 
212   /// Returns true if \p BB is a loop-latch.
213   /// A latch block is a block that contains a branch back to the header.
214   /// This function is useful when there are multiple latches in a loop
215   /// because \fn getLoopLatch will return nullptr in that case.
isLoopLatch(const BlockT * BB)216   bool isLoopLatch(const BlockT *BB) const {
217     assert(!isInvalid() && "Loop not in a valid state!");
218     assert(contains(BB) && "block does not belong to the loop");
219 
220     BlockT *Header = getHeader();
221     auto PredBegin = GraphTraits<Inverse<BlockT *>>::child_begin(Header);
222     auto PredEnd = GraphTraits<Inverse<BlockT *>>::child_end(Header);
223     return std::find(PredBegin, PredEnd, BB) != PredEnd;
224   }
225 
226   /// Calculate the number of back edges to the loop header.
getNumBackEdges()227   unsigned getNumBackEdges() const {
228     assert(!isInvalid() && "Loop not in a valid state!");
229     unsigned NumBackEdges = 0;
230     BlockT *H = getHeader();
231 
232     for (const auto Pred : children<Inverse<BlockT *>>(H))
233       if (contains(Pred))
234         ++NumBackEdges;
235 
236     return NumBackEdges;
237   }
238 
239   //===--------------------------------------------------------------------===//
240   // APIs for simple analysis of the loop.
241   //
242   // Note that all of these methods can fail on general loops (ie, there may not
243   // be a preheader, etc).  For best success, the loop simplification and
244   // induction variable canonicalization pass should be used to normalize loops
245   // for easy analysis.  These methods assume canonical loops.
246 
247   /// Return all blocks inside the loop that have successors outside of the
248   /// loop. These are the blocks _inside of the current loop_ which branch out.
249   /// The returned list is always unique.
250   void getExitingBlocks(SmallVectorImpl<BlockT *> &ExitingBlocks) const;
251 
252   /// If getExitingBlocks would return exactly one block, return that block.
253   /// Otherwise return null.
254   BlockT *getExitingBlock() const;
255 
256   /// Return all of the successor blocks of this loop. These are the blocks
257   /// _outside of the current loop_ which are branched to.
258   void getExitBlocks(SmallVectorImpl<BlockT *> &ExitBlocks) const;
259 
260   /// If getExitBlocks would return exactly one block, return that block.
261   /// Otherwise return null.
262   BlockT *getExitBlock() const;
263 
264   /// Return true if no exit block for the loop has a predecessor that is
265   /// outside the loop.
266   bool hasDedicatedExits() const;
267 
268   /// Return all unique successor blocks of this loop.
269   /// These are the blocks _outside of the current loop_ which are branched to.
270   /// This assumes that loop exits are in canonical form, i.e. all exits are
271   /// dedicated exits.
272   void getUniqueExitBlocks(SmallVectorImpl<BlockT *> &ExitBlocks) const;
273 
274   /// If getUniqueExitBlocks would return exactly one block, return that block.
275   /// Otherwise return null.
276   BlockT *getUniqueExitBlock() const;
277 
278   /// Edge type.
279   typedef std::pair<const BlockT *, const BlockT *> Edge;
280 
281   /// Return all pairs of (_inside_block_,_outside_block_).
282   void getExitEdges(SmallVectorImpl<Edge> &ExitEdges) const;
283 
284   /// If there is a preheader for this loop, return it. A loop has a preheader
285   /// if there is only one edge to the header of the loop from outside of the
286   /// loop. If this is the case, the block branching to the header of the loop
287   /// is the preheader node.
288   ///
289   /// This method returns null if there is no preheader for the loop.
290   BlockT *getLoopPreheader() const;
291 
292   /// If the given loop's header has exactly one unique predecessor outside the
293   /// loop, return it. Otherwise return null.
294   ///  This is less strict that the loop "preheader" concept, which requires
295   /// the predecessor to have exactly one successor.
296   BlockT *getLoopPredecessor() const;
297 
298   /// If there is a single latch block for this loop, return it.
299   /// A latch block is a block that contains a branch back to the header.
300   BlockT *getLoopLatch() const;
301 
302   /// Return all loop latch blocks of this loop. A latch block is a block that
303   /// contains a branch back to the header.
getLoopLatches(SmallVectorImpl<BlockT * > & LoopLatches)304   void getLoopLatches(SmallVectorImpl<BlockT *> &LoopLatches) const {
305     assert(!isInvalid() && "Loop not in a valid state!");
306     BlockT *H = getHeader();
307     for (const auto Pred : children<Inverse<BlockT *>>(H))
308       if (contains(Pred))
309         LoopLatches.push_back(Pred);
310   }
311 
312   //===--------------------------------------------------------------------===//
313   // APIs for updating loop information after changing the CFG
314   //
315 
316   /// This method is used by other analyses to update loop information.
317   /// NewBB is set to be a new member of the current loop.
318   /// Because of this, it is added as a member of all parent loops, and is added
319   /// to the specified LoopInfo object as being in the current basic block.  It
320   /// is not valid to replace the loop header with this method.
321   void addBasicBlockToLoop(BlockT *NewBB, LoopInfoBase<BlockT, LoopT> &LI);
322 
323   /// This is used when splitting loops up. It replaces the OldChild entry in
324   /// our children list with NewChild, and updates the parent pointer of
325   /// OldChild to be null and the NewChild to be this loop.
326   /// This updates the loop depth of the new child.
327   void replaceChildLoopWith(LoopT *OldChild, LoopT *NewChild);
328 
329   /// Add the specified loop to be a child of this loop.
330   /// This updates the loop depth of the new child.
addChildLoop(LoopT * NewChild)331   void addChildLoop(LoopT *NewChild) {
332     assert(!isInvalid() && "Loop not in a valid state!");
333     assert(!NewChild->ParentLoop && "NewChild already has a parent!");
334     NewChild->ParentLoop = static_cast<LoopT *>(this);
335     SubLoops.push_back(NewChild);
336   }
337 
338   /// This removes the specified child from being a subloop of this loop. The
339   /// loop is not deleted, as it will presumably be inserted into another loop.
removeChildLoop(iterator I)340   LoopT *removeChildLoop(iterator I) {
341     assert(!isInvalid() && "Loop not in a valid state!");
342     assert(I != SubLoops.end() && "Cannot remove end iterator!");
343     LoopT *Child = *I;
344     assert(Child->ParentLoop == this && "Child is not a child of this loop!");
345     SubLoops.erase(SubLoops.begin() + (I - begin()));
346     Child->ParentLoop = nullptr;
347     return Child;
348   }
349 
350   /// This removes the specified child from being a subloop of this loop. The
351   /// loop is not deleted, as it will presumably be inserted into another loop.
removeChildLoop(LoopT * Child)352   LoopT *removeChildLoop(LoopT *Child) {
353     return removeChildLoop(llvm::find(*this, Child));
354   }
355 
356   /// This adds a basic block directly to the basic block list.
357   /// This should only be used by transformations that create new loops.  Other
358   /// transformations should use addBasicBlockToLoop.
addBlockEntry(BlockT * BB)359   void addBlockEntry(BlockT *BB) {
360     assert(!isInvalid() && "Loop not in a valid state!");
361     Blocks.push_back(BB);
362     DenseBlockSet.insert(BB);
363   }
364 
365   /// interface to reverse Blocks[from, end of loop] in this loop
reverseBlock(unsigned from)366   void reverseBlock(unsigned from) {
367     assert(!isInvalid() && "Loop not in a valid state!");
368     std::reverse(Blocks.begin() + from, Blocks.end());
369   }
370 
371   /// interface to do reserve() for Blocks
reserveBlocks(unsigned size)372   void reserveBlocks(unsigned size) {
373     assert(!isInvalid() && "Loop not in a valid state!");
374     Blocks.reserve(size);
375   }
376 
377   /// This method is used to move BB (which must be part of this loop) to be the
378   /// loop header of the loop (the block that dominates all others).
moveToHeader(BlockT * BB)379   void moveToHeader(BlockT *BB) {
380     assert(!isInvalid() && "Loop not in a valid state!");
381     if (Blocks[0] == BB)
382       return;
383     for (unsigned i = 0;; ++i) {
384       assert(i != Blocks.size() && "Loop does not contain BB!");
385       if (Blocks[i] == BB) {
386         Blocks[i] = Blocks[0];
387         Blocks[0] = BB;
388         return;
389       }
390     }
391   }
392 
393   /// This removes the specified basic block from the current loop, updating the
394   /// Blocks as appropriate. This does not update the mapping in the LoopInfo
395   /// class.
removeBlockFromLoop(BlockT * BB)396   void removeBlockFromLoop(BlockT *BB) {
397     assert(!isInvalid() && "Loop not in a valid state!");
398     auto I = find(Blocks, BB);
399     assert(I != Blocks.end() && "N is not in this list!");
400     Blocks.erase(I);
401 
402     DenseBlockSet.erase(BB);
403   }
404 
405   /// Verify loop structure
406   void verifyLoop() const;
407 
408   /// Verify loop structure of this loop and all nested loops.
409   void verifyLoopNest(DenseSet<const LoopT *> *Loops) const;
410 
411   /// Print loop with all the BBs inside it.
412   void print(raw_ostream &OS, unsigned Depth = 0, bool Verbose = false) const;
413 
414 protected:
415   friend class LoopInfoBase<BlockT, LoopT>;
416 
417   /// This creates an empty loop.
LoopBase()418   LoopBase() : ParentLoop(nullptr) {}
419 
LoopBase(BlockT * BB)420   explicit LoopBase(BlockT *BB) : ParentLoop(nullptr) {
421     Blocks.push_back(BB);
422     DenseBlockSet.insert(BB);
423   }
424 
425   // Since loop passes like SCEV are allowed to key analysis results off of
426   // `Loop` pointers, we cannot re-use pointers within a loop pass manager.
427   // This means loop passes should not be `delete` ing `Loop` objects directly
428   // (and risk a later `Loop` allocation re-using the address of a previous one)
429   // but should be using LoopInfo::markAsRemoved, which keeps around the `Loop`
430   // pointer till the end of the lifetime of the `LoopInfo` object.
431   //
432   // To make it easier to follow this rule, we mark the destructor as
433   // non-public.
~LoopBase()434   ~LoopBase() {
435     for (auto *SubLoop : SubLoops)
436       SubLoop->~LoopT();
437 
438 #if LLVM_ENABLE_ABI_BREAKING_CHECKS
439     IsInvalid = true;
440 #endif
441     SubLoops.clear();
442     Blocks.clear();
443     DenseBlockSet.clear();
444     ParentLoop = nullptr;
445   }
446 };
447 
448 template <class BlockT, class LoopT>
449 raw_ostream &operator<<(raw_ostream &OS, const LoopBase<BlockT, LoopT> &Loop) {
450   Loop.print(OS);
451   return OS;
452 }
453 
454 // Implementation in LoopInfoImpl.h
455 extern template class LoopBase<BasicBlock, Loop>;
456 
457 /// Represents a single loop in the control flow graph.  Note that not all SCCs
458 /// in the CFG are necessarily loops.
459 class Loop : public LoopBase<BasicBlock, Loop> {
460 public:
461   /// A range representing the start and end location of a loop.
462   class LocRange {
463     DebugLoc Start;
464     DebugLoc End;
465 
466   public:
LocRange()467     LocRange() {}
LocRange(DebugLoc Start)468     LocRange(DebugLoc Start) : Start(std::move(Start)), End(std::move(Start)) {}
LocRange(DebugLoc Start,DebugLoc End)469     LocRange(DebugLoc Start, DebugLoc End)
470         : Start(std::move(Start)), End(std::move(End)) {}
471 
getStart()472     const DebugLoc &getStart() const { return Start; }
getEnd()473     const DebugLoc &getEnd() const { return End; }
474 
475     /// Check for null.
476     ///
477     explicit operator bool() const { return Start && End; }
478   };
479 
480   /// Return true if the specified value is loop invariant.
481   bool isLoopInvariant(const Value *V) const;
482 
483   /// Return true if all the operands of the specified instruction are loop
484   /// invariant.
485   bool hasLoopInvariantOperands(const Instruction *I) const;
486 
487   /// If the given value is an instruction inside of the loop and it can be
488   /// hoisted, do so to make it trivially loop-invariant.
489   /// Return true if the value after any hoisting is loop invariant. This
490   /// function can be used as a slightly more aggressive replacement for
491   /// isLoopInvariant.
492   ///
493   /// If InsertPt is specified, it is the point to hoist instructions to.
494   /// If null, the terminator of the loop preheader is used.
495   bool makeLoopInvariant(Value *V, bool &Changed,
496                          Instruction *InsertPt = nullptr) const;
497 
498   /// If the given instruction is inside of the loop and it can be hoisted, do
499   /// so to make it trivially loop-invariant.
500   /// Return true if the instruction after any hoisting is loop invariant. This
501   /// function can be used as a slightly more aggressive replacement for
502   /// isLoopInvariant.
503   ///
504   /// If InsertPt is specified, it is the point to hoist instructions to.
505   /// If null, the terminator of the loop preheader is used.
506   ///
507   bool makeLoopInvariant(Instruction *I, bool &Changed,
508                          Instruction *InsertPt = nullptr) const;
509 
510   /// Check to see if the loop has a canonical induction variable: an integer
511   /// recurrence that starts at 0 and increments by one each time through the
512   /// loop. If so, return the phi node that corresponds to it.
513   ///
514   /// The IndVarSimplify pass transforms loops to have a canonical induction
515   /// variable.
516   ///
517   PHINode *getCanonicalInductionVariable() const;
518 
519   /// Return true if the Loop is in LCSSA form.
520   bool isLCSSAForm(DominatorTree &DT) const;
521 
522   /// Return true if this Loop and all inner subloops are in LCSSA form.
523   bool isRecursivelyLCSSAForm(DominatorTree &DT, const LoopInfo &LI) const;
524 
525   /// Return true if the Loop is in the form that the LoopSimplify form
526   /// transforms loops to, which is sometimes called normal form.
527   bool isLoopSimplifyForm() const;
528 
529   /// Return true if the loop body is safe to clone in practice.
530   bool isSafeToClone() const;
531 
532   /// Returns true if the loop is annotated parallel.
533   ///
534   /// A parallel loop can be assumed to not contain any dependencies between
535   /// iterations by the compiler. That is, any loop-carried dependency checking
536   /// can be skipped completely when parallelizing the loop on the target
537   /// machine. Thus, if the parallel loop information originates from the
538   /// programmer, e.g. via the OpenMP parallel for pragma, it is the
539   /// programmer's responsibility to ensure there are no loop-carried
540   /// dependencies. The final execution order of the instructions across
541   /// iterations is not guaranteed, thus, the end result might or might not
542   /// implement actual concurrent execution of instructions across multiple
543   /// iterations.
544   bool isAnnotatedParallel() const;
545 
546   /// Return the llvm.loop loop id metadata node for this loop if it is present.
547   ///
548   /// If this loop contains the same llvm.loop metadata on each branch to the
549   /// header then the node is returned. If any latch instruction does not
550   /// contain llvm.loop or if multiple latches contain different nodes then
551   /// 0 is returned.
552   MDNode *getLoopID() const;
553   /// Set the llvm.loop loop id metadata for this loop.
554   ///
555   /// The LoopID metadata node will be added to each terminator instruction in
556   /// the loop that branches to the loop header.
557   ///
558   /// The LoopID metadata node should have one or more operands and the first
559   /// operand should be the node itself.
560   void setLoopID(MDNode *LoopID) const;
561 
562   /// Add llvm.loop.unroll.disable to this loop's loop id metadata.
563   ///
564   /// Remove existing unroll metadata and add unroll disable metadata to
565   /// indicate the loop has already been unrolled.  This prevents a loop
566   /// from being unrolled more than is directed by a pragma if the loop
567   /// unrolling pass is run more than once (which it generally is).
568   void setLoopAlreadyUnrolled();
569 
570   void dump() const;
571   void dumpVerbose() const;
572 
573   /// Return the debug location of the start of this loop.
574   /// This looks for a BB terminating instruction with a known debug
575   /// location by looking at the preheader and header blocks. If it
576   /// cannot find a terminating instruction with location information,
577   /// it returns an unknown location.
578   DebugLoc getStartLoc() const;
579 
580   /// Return the source code span of the loop.
581   LocRange getLocRange() const;
582 
getName()583   StringRef getName() const {
584     if (BasicBlock *Header = getHeader())
585       if (Header->hasName())
586         return Header->getName();
587     return "<unnamed loop>";
588   }
589 
590 private:
591   Loop() = default;
592 
593   friend class LoopInfoBase<BasicBlock, Loop>;
594   friend class LoopBase<BasicBlock, Loop>;
Loop(BasicBlock * BB)595   explicit Loop(BasicBlock *BB) : LoopBase<BasicBlock, Loop>(BB) {}
596   ~Loop() = default;
597 };
598 
599 //===----------------------------------------------------------------------===//
600 /// This class builds and contains all of the top-level loop
601 /// structures in the specified function.
602 ///
603 
604 template <class BlockT, class LoopT> class LoopInfoBase {
605   // BBMap - Mapping of basic blocks to the inner most loop they occur in
606   DenseMap<const BlockT *, LoopT *> BBMap;
607   std::vector<LoopT *> TopLevelLoops;
608   BumpPtrAllocator LoopAllocator;
609 
610   friend class LoopBase<BlockT, LoopT>;
611   friend class LoopInfo;
612 
613   void operator=(const LoopInfoBase &) = delete;
614   LoopInfoBase(const LoopInfoBase &) = delete;
615 
616 public:
LoopInfoBase()617   LoopInfoBase() {}
~LoopInfoBase()618   ~LoopInfoBase() { releaseMemory(); }
619 
LoopInfoBase(LoopInfoBase && Arg)620   LoopInfoBase(LoopInfoBase &&Arg)
621       : BBMap(std::move(Arg.BBMap)),
622         TopLevelLoops(std::move(Arg.TopLevelLoops)),
623         LoopAllocator(std::move(Arg.LoopAllocator)) {
624     // We have to clear the arguments top level loops as we've taken ownership.
625     Arg.TopLevelLoops.clear();
626   }
627   LoopInfoBase &operator=(LoopInfoBase &&RHS) {
628     BBMap = std::move(RHS.BBMap);
629 
630     for (auto *L : TopLevelLoops)
631       L->~LoopT();
632 
633     TopLevelLoops = std::move(RHS.TopLevelLoops);
634     LoopAllocator = std::move(RHS.LoopAllocator);
635     RHS.TopLevelLoops.clear();
636     return *this;
637   }
638 
releaseMemory()639   void releaseMemory() {
640     BBMap.clear();
641 
642     for (auto *L : TopLevelLoops)
643       L->~LoopT();
644     TopLevelLoops.clear();
645     LoopAllocator.Reset();
646   }
647 
AllocateLoop(ArgsTy &&...Args)648   template <typename... ArgsTy> LoopT *AllocateLoop(ArgsTy &&... Args) {
649     LoopT *Storage = LoopAllocator.Allocate<LoopT>();
650     return new (Storage) LoopT(std::forward<ArgsTy>(Args)...);
651   }
652 
653   /// iterator/begin/end - The interface to the top-level loops in the current
654   /// function.
655   ///
656   typedef typename std::vector<LoopT *>::const_iterator iterator;
657   typedef
658       typename std::vector<LoopT *>::const_reverse_iterator reverse_iterator;
begin()659   iterator begin() const { return TopLevelLoops.begin(); }
end()660   iterator end() const { return TopLevelLoops.end(); }
rbegin()661   reverse_iterator rbegin() const { return TopLevelLoops.rbegin(); }
rend()662   reverse_iterator rend() const { return TopLevelLoops.rend(); }
empty()663   bool empty() const { return TopLevelLoops.empty(); }
664 
665   /// Return all of the loops in the function in preorder across the loop
666   /// nests, with siblings in forward program order.
667   ///
668   /// Note that because loops form a forest of trees, preorder is equivalent to
669   /// reverse postorder.
670   SmallVector<LoopT *, 4> getLoopsInPreorder();
671 
672   /// Return all of the loops in the function in preorder across the loop
673   /// nests, with siblings in *reverse* program order.
674   ///
675   /// Note that because loops form a forest of trees, preorder is equivalent to
676   /// reverse postorder.
677   ///
678   /// Also note that this is *not* a reverse preorder. Only the siblings are in
679   /// reverse program order.
680   SmallVector<LoopT *, 4> getLoopsInReverseSiblingPreorder();
681 
682   /// Return the inner most loop that BB lives in. If a basic block is in no
683   /// loop (for example the entry node), null is returned.
getLoopFor(const BlockT * BB)684   LoopT *getLoopFor(const BlockT *BB) const { return BBMap.lookup(BB); }
685 
686   /// Same as getLoopFor.
687   const LoopT *operator[](const BlockT *BB) const { return getLoopFor(BB); }
688 
689   /// Return the loop nesting level of the specified block. A depth of 0 means
690   /// the block is not inside any loop.
getLoopDepth(const BlockT * BB)691   unsigned getLoopDepth(const BlockT *BB) const {
692     const LoopT *L = getLoopFor(BB);
693     return L ? L->getLoopDepth() : 0;
694   }
695 
696   // True if the block is a loop header node
isLoopHeader(const BlockT * BB)697   bool isLoopHeader(const BlockT *BB) const {
698     const LoopT *L = getLoopFor(BB);
699     return L && L->getHeader() == BB;
700   }
701 
702   /// This removes the specified top-level loop from this loop info object.
703   /// The loop is not deleted, as it will presumably be inserted into
704   /// another loop.
removeLoop(iterator I)705   LoopT *removeLoop(iterator I) {
706     assert(I != end() && "Cannot remove end iterator!");
707     LoopT *L = *I;
708     assert(!L->getParentLoop() && "Not a top-level loop!");
709     TopLevelLoops.erase(TopLevelLoops.begin() + (I - begin()));
710     return L;
711   }
712 
713   /// Change the top-level loop that contains BB to the specified loop.
714   /// This should be used by transformations that restructure the loop hierarchy
715   /// tree.
changeLoopFor(BlockT * BB,LoopT * L)716   void changeLoopFor(BlockT *BB, LoopT *L) {
717     if (!L) {
718       BBMap.erase(BB);
719       return;
720     }
721     BBMap[BB] = L;
722   }
723 
724   /// Replace the specified loop in the top-level loops list with the indicated
725   /// loop.
changeTopLevelLoop(LoopT * OldLoop,LoopT * NewLoop)726   void changeTopLevelLoop(LoopT *OldLoop, LoopT *NewLoop) {
727     auto I = find(TopLevelLoops, OldLoop);
728     assert(I != TopLevelLoops.end() && "Old loop not at top level!");
729     *I = NewLoop;
730     assert(!NewLoop->ParentLoop && !OldLoop->ParentLoop &&
731            "Loops already embedded into a subloop!");
732   }
733 
734   /// This adds the specified loop to the collection of top-level loops.
addTopLevelLoop(LoopT * New)735   void addTopLevelLoop(LoopT *New) {
736     assert(!New->getParentLoop() && "Loop already in subloop!");
737     TopLevelLoops.push_back(New);
738   }
739 
740   /// This method completely removes BB from all data structures,
741   /// including all of the Loop objects it is nested in and our mapping from
742   /// BasicBlocks to loops.
removeBlock(BlockT * BB)743   void removeBlock(BlockT *BB) {
744     auto I = BBMap.find(BB);
745     if (I != BBMap.end()) {
746       for (LoopT *L = I->second; L; L = L->getParentLoop())
747         L->removeBlockFromLoop(BB);
748 
749       BBMap.erase(I);
750     }
751   }
752 
753   // Internals
754 
isNotAlreadyContainedIn(const LoopT * SubLoop,const LoopT * ParentLoop)755   static bool isNotAlreadyContainedIn(const LoopT *SubLoop,
756                                       const LoopT *ParentLoop) {
757     if (!SubLoop)
758       return true;
759     if (SubLoop == ParentLoop)
760       return false;
761     return isNotAlreadyContainedIn(SubLoop->getParentLoop(), ParentLoop);
762   }
763 
764   /// Create the loop forest using a stable algorithm.
765   void analyze(const DominatorTreeBase<BlockT, false> &DomTree);
766 
767   // Debugging
768   void print(raw_ostream &OS) const;
769 
770   void verify(const DominatorTreeBase<BlockT, false> &DomTree) const;
771 
772   /// Destroy a loop that has been removed from the `LoopInfo` nest.
773   ///
774   /// This runs the destructor of the loop object making it invalid to
775   /// reference afterward. The memory is retained so that the *pointer* to the
776   /// loop remains valid.
777   ///
778   /// The caller is responsible for removing this loop from the loop nest and
779   /// otherwise disconnecting it from the broader `LoopInfo` data structures.
780   /// Callers that don't naturally handle this themselves should probably call
781   /// `erase' instead.
destroy(LoopT * L)782   void destroy(LoopT *L) {
783     L->~LoopT();
784 
785     // Since LoopAllocator is a BumpPtrAllocator, this Deallocate only poisons
786     // \c L, but the pointer remains valid for non-dereferencing uses.
787     LoopAllocator.Deallocate(L);
788   }
789 };
790 
791 // Implementation in LoopInfoImpl.h
792 extern template class LoopInfoBase<BasicBlock, Loop>;
793 
794 class LoopInfo : public LoopInfoBase<BasicBlock, Loop> {
795   typedef LoopInfoBase<BasicBlock, Loop> BaseT;
796 
797   friend class LoopBase<BasicBlock, Loop>;
798 
799   void operator=(const LoopInfo &) = delete;
800   LoopInfo(const LoopInfo &) = delete;
801 
802 public:
LoopInfo()803   LoopInfo() {}
804   explicit LoopInfo(const DominatorTreeBase<BasicBlock, false> &DomTree);
805 
LoopInfo(LoopInfo && Arg)806   LoopInfo(LoopInfo &&Arg) : BaseT(std::move(static_cast<BaseT &>(Arg))) {}
807   LoopInfo &operator=(LoopInfo &&RHS) {
808     BaseT::operator=(std::move(static_cast<BaseT &>(RHS)));
809     return *this;
810   }
811 
812   /// Handle invalidation explicitly.
813   bool invalidate(Function &F, const PreservedAnalyses &PA,
814                   FunctionAnalysisManager::Invalidator &);
815 
816   // Most of the public interface is provided via LoopInfoBase.
817 
818   /// Update LoopInfo after removing the last backedge from a loop. This updates
819   /// the loop forest and parent loops for each block so that \c L is no longer
820   /// referenced, but does not actually delete \c L immediately. The pointer
821   /// will remain valid until this LoopInfo's memory is released.
822   void erase(Loop *L);
823 
824   /// Returns true if replacing From with To everywhere is guaranteed to
825   /// preserve LCSSA form.
replacementPreservesLCSSAForm(Instruction * From,Value * To)826   bool replacementPreservesLCSSAForm(Instruction *From, Value *To) {
827     // Preserving LCSSA form is only problematic if the replacing value is an
828     // instruction.
829     Instruction *I = dyn_cast<Instruction>(To);
830     if (!I)
831       return true;
832     // If both instructions are defined in the same basic block then replacement
833     // cannot break LCSSA form.
834     if (I->getParent() == From->getParent())
835       return true;
836     // If the instruction is not defined in a loop then it can safely replace
837     // anything.
838     Loop *ToLoop = getLoopFor(I->getParent());
839     if (!ToLoop)
840       return true;
841     // If the replacing instruction is defined in the same loop as the original
842     // instruction, or in a loop that contains it as an inner loop, then using
843     // it as a replacement will not break LCSSA form.
844     return ToLoop->contains(getLoopFor(From->getParent()));
845   }
846 
847   /// Checks if moving a specific instruction can break LCSSA in any loop.
848   ///
849   /// Return true if moving \p Inst to before \p NewLoc will break LCSSA,
850   /// assuming that the function containing \p Inst and \p NewLoc is currently
851   /// in LCSSA form.
movementPreservesLCSSAForm(Instruction * Inst,Instruction * NewLoc)852   bool movementPreservesLCSSAForm(Instruction *Inst, Instruction *NewLoc) {
853     assert(Inst->getFunction() == NewLoc->getFunction() &&
854            "Can't reason about IPO!");
855 
856     auto *OldBB = Inst->getParent();
857     auto *NewBB = NewLoc->getParent();
858 
859     // Movement within the same loop does not break LCSSA (the equality check is
860     // to avoid doing a hashtable lookup in case of intra-block movement).
861     if (OldBB == NewBB)
862       return true;
863 
864     auto *OldLoop = getLoopFor(OldBB);
865     auto *NewLoop = getLoopFor(NewBB);
866 
867     if (OldLoop == NewLoop)
868       return true;
869 
870     // Check if Outer contains Inner; with the null loop counting as the
871     // "outermost" loop.
872     auto Contains = [](const Loop *Outer, const Loop *Inner) {
873       return !Outer || Outer->contains(Inner);
874     };
875 
876     // To check that the movement of Inst to before NewLoc does not break LCSSA,
877     // we need to check two sets of uses for possible LCSSA violations at
878     // NewLoc: the users of NewInst, and the operands of NewInst.
879 
880     // If we know we're hoisting Inst out of an inner loop to an outer loop,
881     // then the uses *of* Inst don't need to be checked.
882 
883     if (!Contains(NewLoop, OldLoop)) {
884       for (Use &U : Inst->uses()) {
885         auto *UI = cast<Instruction>(U.getUser());
886         auto *UBB = isa<PHINode>(UI) ? cast<PHINode>(UI)->getIncomingBlock(U)
887                                      : UI->getParent();
888         if (UBB != NewBB && getLoopFor(UBB) != NewLoop)
889           return false;
890       }
891     }
892 
893     // If we know we're sinking Inst from an outer loop into an inner loop, then
894     // the *operands* of Inst don't need to be checked.
895 
896     if (!Contains(OldLoop, NewLoop)) {
897       // See below on why we can't handle phi nodes here.
898       if (isa<PHINode>(Inst))
899         return false;
900 
901       for (Use &U : Inst->operands()) {
902         auto *DefI = dyn_cast<Instruction>(U.get());
903         if (!DefI)
904           return false;
905 
906         // This would need adjustment if we allow Inst to be a phi node -- the
907         // new use block won't simply be NewBB.
908 
909         auto *DefBlock = DefI->getParent();
910         if (DefBlock != NewBB && getLoopFor(DefBlock) != NewLoop)
911           return false;
912       }
913     }
914 
915     return true;
916   }
917 };
918 
919 // Allow clients to walk the list of nested loops...
920 template <> struct GraphTraits<const Loop *> {
921   typedef const Loop *NodeRef;
922   typedef LoopInfo::iterator ChildIteratorType;
923 
924   static NodeRef getEntryNode(const Loop *L) { return L; }
925   static ChildIteratorType child_begin(NodeRef N) { return N->begin(); }
926   static ChildIteratorType child_end(NodeRef N) { return N->end(); }
927 };
928 
929 template <> struct GraphTraits<Loop *> {
930   typedef Loop *NodeRef;
931   typedef LoopInfo::iterator ChildIteratorType;
932 
933   static NodeRef getEntryNode(Loop *L) { return L; }
934   static ChildIteratorType child_begin(NodeRef N) { return N->begin(); }
935   static ChildIteratorType child_end(NodeRef N) { return N->end(); }
936 };
937 
938 /// Analysis pass that exposes the \c LoopInfo for a function.
939 class LoopAnalysis : public AnalysisInfoMixin<LoopAnalysis> {
940   friend AnalysisInfoMixin<LoopAnalysis>;
941   static AnalysisKey Key;
942 
943 public:
944   typedef LoopInfo Result;
945 
946   LoopInfo run(Function &F, FunctionAnalysisManager &AM);
947 };
948 
949 /// Printer pass for the \c LoopAnalysis results.
950 class LoopPrinterPass : public PassInfoMixin<LoopPrinterPass> {
951   raw_ostream &OS;
952 
953 public:
954   explicit LoopPrinterPass(raw_ostream &OS) : OS(OS) {}
955   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
956 };
957 
958 /// Verifier pass for the \c LoopAnalysis results.
959 struct LoopVerifierPass : public PassInfoMixin<LoopVerifierPass> {
960   PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
961 };
962 
963 /// The legacy pass manager's analysis pass to compute loop information.
964 class LoopInfoWrapperPass : public FunctionPass {
965   LoopInfo LI;
966 
967 public:
968   static char ID; // Pass identification, replacement for typeid
969 
970   LoopInfoWrapperPass() : FunctionPass(ID) {
971     initializeLoopInfoWrapperPassPass(*PassRegistry::getPassRegistry());
972   }
973 
974   LoopInfo &getLoopInfo() { return LI; }
975   const LoopInfo &getLoopInfo() const { return LI; }
976 
977   /// Calculate the natural loop information for a given function.
978   bool runOnFunction(Function &F) override;
979 
980   void verifyAnalysis() const override;
981 
982   void releaseMemory() override { LI.releaseMemory(); }
983 
984   void print(raw_ostream &O, const Module *M = nullptr) const override;
985 
986   void getAnalysisUsage(AnalysisUsage &AU) const override;
987 };
988 
989 /// Function to print a loop's contents as LLVM's text IR assembly.
990 void printLoop(Loop &L, raw_ostream &OS, const std::string &Banner = "");
991 
992 } // End llvm namespace
993 
994 #endif
995