1 //===- GreedyPatternRewriteDriver.cpp - A greedy rewriter -----------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements mlir::applyPatternsAndFoldGreedily.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "mlir/Transforms/GreedyPatternRewriteDriver.h"
14 #include "mlir/Interfaces/SideEffectInterfaces.h"
15 #include "mlir/Rewrite/PatternApplicator.h"
16 #include "mlir/Transforms/FoldUtils.h"
17 #include "mlir/Transforms/RegionUtils.h"
18 #include "llvm/ADT/DenseMap.h"
19 #include "llvm/Support/CommandLine.h"
20 #include "llvm/Support/Debug.h"
21 #include "llvm/Support/raw_ostream.h"
22 
23 using namespace mlir;
24 
25 #define DEBUG_TYPE "pattern-matcher"
26 
27 /// The max number of iterations scanning for pattern match.
28 static unsigned maxPatternMatchIterations = 10;
29 
30 //===----------------------------------------------------------------------===//
31 // GreedyPatternRewriteDriver
32 //===----------------------------------------------------------------------===//
33 
34 namespace {
35 /// This is a worklist-driven driver for the PatternMatcher, which repeatedly
36 /// applies the locally optimal patterns in a roughly "bottom up" way.
37 class GreedyPatternRewriteDriver : public PatternRewriter {
38 public:
39   explicit GreedyPatternRewriteDriver(MLIRContext *ctx,
40                                       const FrozenRewritePatternList &patterns)
41       : PatternRewriter(ctx), matcher(patterns), folder(ctx) {
42     worklist.reserve(64);
43 
44     // Apply a simple cost model based solely on pattern benefit.
45     matcher.applyDefaultCostModel();
46   }
47 
48   bool simplify(MutableArrayRef<Region> regions, int maxIterations);
49 
50   void addToWorklist(Operation *op) {
51     // Check to see if the worklist already contains this op.
52     if (worklistMap.count(op))
53       return;
54 
55     worklistMap[op] = worklist.size();
56     worklist.push_back(op);
57   }
58 
59   Operation *popFromWorklist() {
60     auto *op = worklist.back();
61     worklist.pop_back();
62 
63     // This operation is no longer in the worklist, keep worklistMap up to date.
64     if (op)
65       worklistMap.erase(op);
66     return op;
67   }
68 
69   /// If the specified operation is in the worklist, remove it.  If not, this is
70   /// a no-op.
71   void removeFromWorklist(Operation *op) {
72     auto it = worklistMap.find(op);
73     if (it != worklistMap.end()) {
74       assert(worklist[it->second] == op && "malformed worklist data structure");
75       worklist[it->second] = nullptr;
76       worklistMap.erase(it);
77     }
78   }
79 
80   // These are hooks implemented for PatternRewriter.
81 protected:
82   // Implement the hook for inserting operations, and make sure that newly
83   // inserted ops are added to the worklist for processing.
84   void notifyOperationInserted(Operation *op) override { addToWorklist(op); }
85 
86   // If an operation is about to be removed, make sure it is not in our
87   // worklist anymore because we'd get dangling references to it.
88   void notifyOperationRemoved(Operation *op) override {
89     addToWorklist(op->getOperands());
90     op->walk([this](Operation *operation) {
91       removeFromWorklist(operation);
92       folder.notifyRemoval(operation);
93     });
94   }
95 
96   // When the root of a pattern is about to be replaced, it can trigger
97   // simplifications to its users - make sure to add them to the worklist
98   // before the root is changed.
99   void notifyRootReplaced(Operation *op) override {
100     for (auto result : op->getResults())
101       for (auto *user : result.getUsers())
102         addToWorklist(user);
103   }
104 
105 private:
106   // Look over the provided operands for any defining operations that should
107   // be re-added to the worklist. This function should be called when an
108   // operation is modified or removed, as it may trigger further
109   // simplifications.
110   template <typename Operands>
111   void addToWorklist(Operands &&operands) {
112     for (Value operand : operands) {
113       // If the use count of this operand is now < 2, we re-add the defining
114       // operation to the worklist.
115       // TODO: This is based on the fact that zero use operations
116       // may be deleted, and that single use values often have more
117       // canonicalization opportunities.
118       if (!operand.use_empty() && !operand.hasOneUse())
119         continue;
120       if (auto *defInst = operand.getDefiningOp())
121         addToWorklist(defInst);
122     }
123   }
124 
125   /// The low-level pattern applicator.
126   PatternApplicator matcher;
127 
128   /// The worklist for this transformation keeps track of the operations that
129   /// need to be revisited, plus their index in the worklist.  This allows us to
130   /// efficiently remove operations from the worklist when they are erased, even
131   /// if they aren't the root of a pattern.
132   std::vector<Operation *> worklist;
133   DenseMap<Operation *, unsigned> worklistMap;
134 
135   /// Non-pattern based folder for operations.
136   OperationFolder folder;
137 };
138 } // end anonymous namespace
139 
140 /// Performs the rewrites while folding and erasing any dead ops. Returns true
141 /// if the rewrite converges in `maxIterations`.
142 bool GreedyPatternRewriteDriver::simplify(MutableArrayRef<Region> regions,
143                                           int maxIterations) {
144   // Perform a prepass over the IR to discover constants.
145   for (auto &region : regions)
146     folder.processExistingConstants(region);
147 
148   bool changed = false;
149   int iteration = 0;
150   do {
151     assert(worklist.empty() &&
152            "Each iteration should start with empty worklist");
153 
154     // Add all nested operations to the worklist in preorder.
155     for (auto &region : regions)
156       region.walk<WalkOrder::PreOrder>(
157           [this](Operation *op) { worklist.push_back(op); });
158 
159     // Reverse the list so our pop-back loop processes them in-order.
160     std::reverse(worklist.begin(), worklist.end());
161     // Remember the reverse index.
162     for (unsigned i = 0, e = worklist.size(); i != e; ++i)
163       worklistMap[worklist[i]] = i;
164 
165     // These are scratch vectors used in the folding loop below.
166     SmallVector<Value, 8> originalOperands, resultValues;
167 
168     changed = false;
169     while (!worklist.empty()) {
170       auto *op = popFromWorklist();
171 
172       // Nulls get added to the worklist when operations are removed, ignore
173       // them.
174       if (op == nullptr)
175         continue;
176 
177       // If the operation is trivially dead - remove it.
178       if (isOpTriviallyDead(op)) {
179         notifyOperationRemoved(op);
180         op->erase();
181         changed = true;
182         continue;
183       }
184 
185       // Collects all the operands and result uses of the given `op` into work
186       // list. Also remove `op` and nested ops from worklist.
187       originalOperands.assign(op->operand_begin(), op->operand_end());
188       auto preReplaceAction = [&](Operation *op) {
189         // Add the operands to the worklist for visitation.
190         addToWorklist(originalOperands);
191 
192         // Add all the users of the result to the worklist so we make sure
193         // to revisit them.
194         for (auto result : op->getResults())
195           for (auto *userOp : result.getUsers())
196             addToWorklist(userOp);
197 
198         notifyOperationRemoved(op);
199       };
200 
201       // Add the given operation to the worklist.
202       auto collectOps = [this](Operation *op) { addToWorklist(op); };
203 
204       // Try to fold this op.
205       bool inPlaceUpdate;
206       if ((succeeded(folder.tryToFold(op, collectOps, preReplaceAction,
207                                       &inPlaceUpdate)))) {
208         changed = true;
209         if (!inPlaceUpdate)
210           continue;
211       }
212 
213       // Try to match one of the patterns. The rewriter is automatically
214       // notified of any necessary changes, so there is nothing else to do here.
215       changed |= succeeded(matcher.matchAndRewrite(op, *this));
216     }
217 
218     // After applying patterns, make sure that the CFG of each of the regions is
219     // kept up to date.
220     if (succeeded(simplifyRegions(regions))) {
221       folder.clear();
222       changed = true;
223     }
224   } while (changed && ++iteration < maxIterations);
225   // Whether the rewrite converges, i.e. wasn't changed in the last iteration.
226   return !changed;
227 }
228 
229 /// Rewrite the regions of the specified operation, which must be isolated from
230 /// above, by repeatedly applying the highest benefit patterns in a greedy
231 /// work-list driven manner. Return success if no more patterns can be matched
232 /// in the result operation regions. Note: This does not apply patterns to the
233 /// top-level operation itself.
234 ///
235 LogicalResult
236 mlir::applyPatternsAndFoldGreedily(Operation *op,
237                                    const FrozenRewritePatternList &patterns) {
238   return applyPatternsAndFoldGreedily(op, patterns, maxPatternMatchIterations);
239 }
240 LogicalResult
241 mlir::applyPatternsAndFoldGreedily(Operation *op,
242                                    const FrozenRewritePatternList &patterns,
243                                    unsigned maxIterations) {
244   return applyPatternsAndFoldGreedily(op->getRegions(), patterns,
245                                       maxIterations);
246 }
247 /// Rewrite the given regions, which must be isolated from above.
248 LogicalResult
249 mlir::applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions,
250                                    const FrozenRewritePatternList &patterns) {
251   return applyPatternsAndFoldGreedily(regions, patterns,
252                                       maxPatternMatchIterations);
253 }
254 LogicalResult
255 mlir::applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions,
256                                    const FrozenRewritePatternList &patterns,
257                                    unsigned maxIterations) {
258   if (regions.empty())
259     return success();
260 
261   // The top-level operation must be known to be isolated from above to
262   // prevent performing canonicalizations on operations defined at or above
263   // the region containing 'op'.
264   auto regionIsIsolated = [](Region &region) {
265     return region.getParentOp()->hasTrait<OpTrait::IsIsolatedFromAbove>();
266   };
267   (void)regionIsIsolated;
268   assert(llvm::all_of(regions, regionIsIsolated) &&
269          "patterns can only be applied to operations IsolatedFromAbove");
270 
271   // Start the pattern driver.
272   GreedyPatternRewriteDriver driver(regions[0].getContext(), patterns);
273   bool converged = driver.simplify(regions, maxIterations);
274   LLVM_DEBUG(if (!converged) {
275     llvm::dbgs() << "The pattern rewrite doesn't converge after scanning "
276                  << maxIterations << " times\n";
277   });
278   return success(converged);
279 }
280 
281 //===----------------------------------------------------------------------===//
282 // OpPatternRewriteDriver
283 //===----------------------------------------------------------------------===//
284 
285 namespace {
286 /// This is a simple driver for the PatternMatcher to apply patterns and perform
287 /// folding on a single op. It repeatedly applies locally optimal patterns.
288 class OpPatternRewriteDriver : public PatternRewriter {
289 public:
290   explicit OpPatternRewriteDriver(MLIRContext *ctx,
291                                   const FrozenRewritePatternList &patterns)
292       : PatternRewriter(ctx), matcher(patterns), folder(ctx) {
293     // Apply a simple cost model based solely on pattern benefit.
294     matcher.applyDefaultCostModel();
295   }
296 
297   /// Performs the rewrites and folding only on `op`. The simplification
298   /// converges if the op is erased as a result of being folded, replaced, or
299   /// dead, or no more changes happen in an iteration. Returns success if the
300   /// rewrite converges in `maxIterations`. `erased` is set to true if `op` gets
301   /// erased.
302   LogicalResult simplifyLocally(Operation *op, int maxIterations, bool &erased);
303 
304   // These are hooks implemented for PatternRewriter.
305 protected:
306   /// If an operation is about to be removed, mark it so that we can let clients
307   /// know.
308   void notifyOperationRemoved(Operation *op) override {
309     opErasedViaPatternRewrites = true;
310   }
311 
312   // When a root is going to be replaced, its removal will be notified as well.
313   // So there is nothing to do here.
314   void notifyRootReplaced(Operation *op) override {}
315 
316 private:
317   /// The low-level pattern applicator.
318   PatternApplicator matcher;
319 
320   /// Non-pattern based folder for operations.
321   OperationFolder folder;
322 
323   /// Set to true if the operation has been erased via pattern rewrites.
324   bool opErasedViaPatternRewrites = false;
325 };
326 
327 } // anonymous namespace
328 
329 LogicalResult OpPatternRewriteDriver::simplifyLocally(Operation *op,
330                                                       int maxIterations,
331                                                       bool &erased) {
332   bool changed = false;
333   erased = false;
334   opErasedViaPatternRewrites = false;
335   int i = 0;
336   // Iterate until convergence or until maxIterations. Deletion of the op as
337   // a result of being dead or folded is convergence.
338   do {
339     changed = false;
340 
341     // If the operation is trivially dead - remove it.
342     if (isOpTriviallyDead(op)) {
343       op->erase();
344       erased = true;
345       return success();
346     }
347 
348     // Try to fold this op.
349     bool inPlaceUpdate;
350     if (succeeded(folder.tryToFold(op, /*processGeneratedConstants=*/nullptr,
351                                    /*preReplaceAction=*/nullptr,
352                                    &inPlaceUpdate))) {
353       changed = true;
354       if (!inPlaceUpdate) {
355         erased = true;
356         return success();
357       }
358     }
359 
360     // Try to match one of the patterns. The rewriter is automatically
361     // notified of any necessary changes, so there is nothing else to do here.
362     changed |= succeeded(matcher.matchAndRewrite(op, *this));
363     if ((erased = opErasedViaPatternRewrites))
364       return success();
365   } while (changed && ++i < maxIterations);
366 
367   // Whether the rewrite converges, i.e. wasn't changed in the last iteration.
368   return failure(changed);
369 }
370 
371 /// Rewrites only `op` using the supplied canonicalization patterns and
372 /// folding. `erased` is set to true if the op is erased as a result of being
373 /// folded, replaced, or dead.
374 LogicalResult mlir::applyOpPatternsAndFold(
375     Operation *op, const FrozenRewritePatternList &patterns, bool *erased) {
376   // Start the pattern driver.
377   OpPatternRewriteDriver driver(op->getContext(), patterns);
378   bool opErased;
379   LogicalResult converged =
380       driver.simplifyLocally(op, maxPatternMatchIterations, opErased);
381   if (erased)
382     *erased = opErased;
383   LLVM_DEBUG(if (failed(converged)) {
384     llvm::dbgs() << "The pattern rewrite doesn't converge after scanning "
385                  << maxPatternMatchIterations << " times";
386   });
387   return converged;
388 }
389