1 //===- GreedyPatternRewriteDriver.cpp - A greedy rewriter -----------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
// This file implements mlir::applyPatternsAndFoldGreedily and
// mlir::applyOpPatternsAndFold.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "mlir/Transforms/GreedyPatternRewriteDriver.h"
14 #include "mlir/Interfaces/SideEffectInterfaces.h"
15 #include "mlir/Rewrite/PatternApplicator.h"
16 #include "mlir/Transforms/FoldUtils.h"
17 #include "mlir/Transforms/RegionUtils.h"
18 #include "llvm/ADT/DenseMap.h"
19 #include "llvm/Support/CommandLine.h"
20 #include "llvm/Support/Debug.h"
21 #include "llvm/Support/raw_ostream.h"
22 
23 using namespace mlir;
24 
25 #define DEBUG_TYPE "pattern-matcher"
26 
/// The max number of iterations scanning for pattern match. Used as the
/// iteration limit by the entry points in this file whenever the caller does
/// not pass an explicit one. It is never written after initialization, so it
/// is declared as a compile-time constant.
static constexpr unsigned maxPatternMatchIterations = 10;
29 
30 //===----------------------------------------------------------------------===//
31 // GreedyPatternRewriteDriver
32 //===----------------------------------------------------------------------===//
33 
34 namespace {
35 /// This is a worklist-driven driver for the PatternMatcher, which repeatedly
36 /// applies the locally optimal patterns in a roughly "bottom up" way.
37 class GreedyPatternRewriteDriver : public PatternRewriter {
38 public:
GreedyPatternRewriteDriver(MLIRContext * ctx,const FrozenRewritePatternList & patterns)39   explicit GreedyPatternRewriteDriver(MLIRContext *ctx,
40                                       const FrozenRewritePatternList &patterns)
41       : PatternRewriter(ctx), matcher(patterns), folder(ctx) {
42     worklist.reserve(64);
43 
44     // Apply a simple cost model based solely on pattern benefit.
45     matcher.applyDefaultCostModel();
46   }
47 
48   bool simplify(MutableArrayRef<Region> regions, int maxIterations);
49 
addToWorklist(Operation * op)50   void addToWorklist(Operation *op) {
51     // Check to see if the worklist already contains this op.
52     if (worklistMap.count(op))
53       return;
54 
55     worklistMap[op] = worklist.size();
56     worklist.push_back(op);
57   }
58 
popFromWorklist()59   Operation *popFromWorklist() {
60     auto *op = worklist.back();
61     worklist.pop_back();
62 
63     // This operation is no longer in the worklist, keep worklistMap up to date.
64     if (op)
65       worklistMap.erase(op);
66     return op;
67   }
68 
69   /// If the specified operation is in the worklist, remove it.  If not, this is
70   /// a no-op.
removeFromWorklist(Operation * op)71   void removeFromWorklist(Operation *op) {
72     auto it = worklistMap.find(op);
73     if (it != worklistMap.end()) {
74       assert(worklist[it->second] == op && "malformed worklist data structure");
75       worklist[it->second] = nullptr;
76       worklistMap.erase(it);
77     }
78   }
79 
80   // These are hooks implemented for PatternRewriter.
81 protected:
82   // Implement the hook for inserting operations, and make sure that newly
83   // inserted ops are added to the worklist for processing.
notifyOperationInserted(Operation * op)84   void notifyOperationInserted(Operation *op) override { addToWorklist(op); }
85 
86   // If an operation is about to be removed, make sure it is not in our
87   // worklist anymore because we'd get dangling references to it.
notifyOperationRemoved(Operation * op)88   void notifyOperationRemoved(Operation *op) override {
89     addToWorklist(op->getOperands());
90     op->walk([this](Operation *operation) {
91       removeFromWorklist(operation);
92       folder.notifyRemoval(operation);
93     });
94   }
95 
96   // When the root of a pattern is about to be replaced, it can trigger
97   // simplifications to its users - make sure to add them to the worklist
98   // before the root is changed.
notifyRootReplaced(Operation * op)99   void notifyRootReplaced(Operation *op) override {
100     for (auto result : op->getResults())
101       for (auto *user : result.getUsers())
102         addToWorklist(user);
103   }
104 
105 private:
106   // Look over the provided operands for any defining operations that should
107   // be re-added to the worklist. This function should be called when an
108   // operation is modified or removed, as it may trigger further
109   // simplifications.
addToWorklist(Operands && operands)110   template <typename Operands> void addToWorklist(Operands &&operands) {
111     for (Value operand : operands) {
112       // If the use count of this operand is now < 2, we re-add the defining
113       // operation to the worklist.
114       // TODO: This is based on the fact that zero use operations
115       // may be deleted, and that single use values often have more
116       // canonicalization opportunities.
117       if (!operand.use_empty() && !operand.hasOneUse())
118         continue;
119       if (auto *defInst = operand.getDefiningOp())
120         addToWorklist(defInst);
121     }
122   }
123 
124   /// The low-level pattern applicator.
125   PatternApplicator matcher;
126 
127   /// The worklist for this transformation keeps track of the operations that
128   /// need to be revisited, plus their index in the worklist.  This allows us to
129   /// efficiently remove operations from the worklist when they are erased, even
130   /// if they aren't the root of a pattern.
131   std::vector<Operation *> worklist;
132   DenseMap<Operation *, unsigned> worklistMap;
133 
134   /// Non-pattern based folder for operations.
135   OperationFolder folder;
136 };
137 } // end anonymous namespace
138 
139 /// Performs the rewrites while folding and erasing any dead ops. Returns true
140 /// if the rewrite converges in `maxIterations`.
simplify(MutableArrayRef<Region> regions,int maxIterations)141 bool GreedyPatternRewriteDriver::simplify(MutableArrayRef<Region> regions,
142                                           int maxIterations) {
143   // Add the given operation to the worklist.
144   auto collectOps = [this](Operation *op) { addToWorklist(op); };
145 
146   bool changed = false;
147   int i = 0;
148   do {
149     // Add all nested operations to the worklist.
150     for (auto &region : regions)
151       region.walk(collectOps);
152 
153     // These are scratch vectors used in the folding loop below.
154     SmallVector<Value, 8> originalOperands, resultValues;
155 
156     changed = false;
157     while (!worklist.empty()) {
158       auto *op = popFromWorklist();
159 
160       // Nulls get added to the worklist when operations are removed, ignore
161       // them.
162       if (op == nullptr)
163         continue;
164 
165       // If the operation is trivially dead - remove it.
166       if (isOpTriviallyDead(op)) {
167         notifyOperationRemoved(op);
168         op->erase();
169         changed = true;
170         continue;
171       }
172 
173       // Collects all the operands and result uses of the given `op` into work
174       // list. Also remove `op` and nested ops from worklist.
175       originalOperands.assign(op->operand_begin(), op->operand_end());
176       auto preReplaceAction = [&](Operation *op) {
177         // Add the operands to the worklist for visitation.
178         addToWorklist(originalOperands);
179 
180         // Add all the users of the result to the worklist so we make sure
181         // to revisit them.
182         for (auto result : op->getResults())
183           for (auto *userOp : result.getUsers())
184             addToWorklist(userOp);
185 
186         notifyOperationRemoved(op);
187       };
188 
189       // Try to fold this op.
190       bool inPlaceUpdate;
191       if ((succeeded(folder.tryToFold(op, collectOps, preReplaceAction,
192                                       &inPlaceUpdate)))) {
193         changed = true;
194         if (!inPlaceUpdate)
195           continue;
196       }
197 
198       // Try to match one of the patterns. The rewriter is automatically
199       // notified of any necessary changes, so there is nothing else to do here.
200       changed |= succeeded(matcher.matchAndRewrite(op, *this));
201     }
202 
203     // After applying patterns, make sure that the CFG of each of the regions is
204     // kept up to date.
205     if (succeeded(simplifyRegions(regions))) {
206       folder.clear();
207       changed = true;
208     }
209   } while (changed && ++i < maxIterations);
210   // Whether the rewrite converges, i.e. wasn't changed in the last iteration.
211   return !changed;
212 }
213 
214 /// Rewrite the regions of the specified operation, which must be isolated from
215 /// above, by repeatedly applying the highest benefit patterns in a greedy
216 /// work-list driven manner. Return success if no more patterns can be matched
217 /// in the result operation regions. Note: This does not apply patterns to the
218 /// top-level operation itself.
219 ///
220 LogicalResult
applyPatternsAndFoldGreedily(Operation * op,const FrozenRewritePatternList & patterns)221 mlir::applyPatternsAndFoldGreedily(Operation *op,
222                                    const FrozenRewritePatternList &patterns) {
223   return applyPatternsAndFoldGreedily(op, patterns, maxPatternMatchIterations);
224 }
225 LogicalResult
applyPatternsAndFoldGreedily(Operation * op,const FrozenRewritePatternList & patterns,unsigned maxIterations)226 mlir::applyPatternsAndFoldGreedily(Operation *op,
227                                    const FrozenRewritePatternList &patterns,
228                                    unsigned maxIterations) {
229   return applyPatternsAndFoldGreedily(op->getRegions(), patterns,
230                                       maxIterations);
231 }
232 /// Rewrite the given regions, which must be isolated from above.
233 LogicalResult
applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions,const FrozenRewritePatternList & patterns)234 mlir::applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions,
235                                    const FrozenRewritePatternList &patterns) {
236   return applyPatternsAndFoldGreedily(regions, patterns,
237                                       maxPatternMatchIterations);
238 }
239 LogicalResult
applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions,const FrozenRewritePatternList & patterns,unsigned maxIterations)240 mlir::applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions,
241                                    const FrozenRewritePatternList &patterns,
242                                    unsigned maxIterations) {
243   if (regions.empty())
244     return success();
245 
246   // The top-level operation must be known to be isolated from above to
247   // prevent performing canonicalizations on operations defined at or above
248   // the region containing 'op'.
249   auto regionIsIsolated = [](Region &region) {
250     return region.getParentOp()->isKnownIsolatedFromAbove();
251   };
252   (void)regionIsIsolated;
253   assert(llvm::all_of(regions, regionIsIsolated) &&
254          "patterns can only be applied to operations IsolatedFromAbove");
255 
256   // Start the pattern driver.
257   GreedyPatternRewriteDriver driver(regions[0].getContext(), patterns);
258   bool converged = driver.simplify(regions, maxIterations);
259   LLVM_DEBUG(if (!converged) {
260     llvm::dbgs() << "The pattern rewrite doesn't converge after scanning "
261                  << maxIterations << " times";
262   });
263   return success(converged);
264 }
265 
266 //===----------------------------------------------------------------------===//
267 // OpPatternRewriteDriver
268 //===----------------------------------------------------------------------===//
269 
270 namespace {
271 /// This is a simple driver for the PatternMatcher to apply patterns and perform
272 /// folding on a single op. It repeatedly applies locally optimal patterns.
273 class OpPatternRewriteDriver : public PatternRewriter {
274 public:
OpPatternRewriteDriver(MLIRContext * ctx,const FrozenRewritePatternList & patterns)275   explicit OpPatternRewriteDriver(MLIRContext *ctx,
276                                   const FrozenRewritePatternList &patterns)
277       : PatternRewriter(ctx), matcher(patterns), folder(ctx) {
278     // Apply a simple cost model based solely on pattern benefit.
279     matcher.applyDefaultCostModel();
280   }
281 
282   /// Performs the rewrites and folding only on `op`. The simplification
283   /// converges if the op is erased as a result of being folded, replaced, or
284   /// dead, or no more changes happen in an iteration. Returns success if the
285   /// rewrite converges in `maxIterations`. `erased` is set to true if `op` gets
286   /// erased.
287   LogicalResult simplifyLocally(Operation *op, int maxIterations, bool &erased);
288 
289   // These are hooks implemented for PatternRewriter.
290 protected:
291   /// If an operation is about to be removed, mark it so that we can let clients
292   /// know.
notifyOperationRemoved(Operation * op)293   void notifyOperationRemoved(Operation *op) override {
294     opErasedViaPatternRewrites = true;
295   }
296 
297   // When a root is going to be replaced, its removal will be notified as well.
298   // So there is nothing to do here.
notifyRootReplaced(Operation * op)299   void notifyRootReplaced(Operation *op) override {}
300 
301 private:
302   /// The low-level pattern applicator.
303   PatternApplicator matcher;
304 
305   /// Non-pattern based folder for operations.
306   OperationFolder folder;
307 
308   /// Set to true if the operation has been erased via pattern rewrites.
309   bool opErasedViaPatternRewrites = false;
310 };
311 
312 } // anonymous namespace
313 
simplifyLocally(Operation * op,int maxIterations,bool & erased)314 LogicalResult OpPatternRewriteDriver::simplifyLocally(Operation *op,
315                                                       int maxIterations,
316                                                       bool &erased) {
317   bool changed = false;
318   erased = false;
319   opErasedViaPatternRewrites = false;
320   int i = 0;
321   // Iterate until convergence or until maxIterations. Deletion of the op as
322   // a result of being dead or folded is convergence.
323   do {
324     changed = false;
325 
326     // If the operation is trivially dead - remove it.
327     if (isOpTriviallyDead(op)) {
328       op->erase();
329       erased = true;
330       return success();
331     }
332 
333     // Try to fold this op.
334     bool inPlaceUpdate;
335     if (succeeded(folder.tryToFold(op, /*processGeneratedConstants=*/nullptr,
336                                    /*preReplaceAction=*/nullptr,
337                                    &inPlaceUpdate))) {
338       changed = true;
339       if (!inPlaceUpdate) {
340         erased = true;
341         return success();
342       }
343     }
344 
345     // Try to match one of the patterns. The rewriter is automatically
346     // notified of any necessary changes, so there is nothing else to do here.
347     changed |= succeeded(matcher.matchAndRewrite(op, *this));
348     if ((erased = opErasedViaPatternRewrites))
349       return success();
350   } while (changed && ++i < maxIterations);
351 
352   // Whether the rewrite converges, i.e. wasn't changed in the last iteration.
353   return failure(changed);
354 }
355 
356 /// Rewrites only `op` using the supplied canonicalization patterns and
357 /// folding. `erased` is set to true if the op is erased as a result of being
358 /// folded, replaced, or dead.
applyOpPatternsAndFold(Operation * op,const FrozenRewritePatternList & patterns,bool * erased)359 LogicalResult mlir::applyOpPatternsAndFold(
360     Operation *op, const FrozenRewritePatternList &patterns, bool *erased) {
361   // Start the pattern driver.
362   OpPatternRewriteDriver driver(op->getContext(), patterns);
363   bool opErased;
364   LogicalResult converged =
365       driver.simplifyLocally(op, maxPatternMatchIterations, opErased);
366   if (erased)
367     *erased = opErased;
368   LLVM_DEBUG(if (failed(converged)) {
369     llvm::dbgs() << "The pattern rewrite doesn't converge after scanning "
370                  << maxPatternMatchIterations << " times";
371   });
372   return converged;
373 }
374