1 //===- GreedyPatternRewriteDriver.cpp - A greedy rewriter -----------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements mlir::applyPatternsAndFoldGreedily. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "mlir/Transforms/GreedyPatternRewriteDriver.h" 14 #include "mlir/Interfaces/SideEffectInterfaces.h" 15 #include "mlir/Rewrite/PatternApplicator.h" 16 #include "mlir/Transforms/FoldUtils.h" 17 #include "mlir/Transforms/RegionUtils.h" 18 #include "llvm/ADT/DenseMap.h" 19 #include "llvm/Support/CommandLine.h" 20 #include "llvm/Support/Debug.h" 21 #include "llvm/Support/raw_ostream.h" 22 23 using namespace mlir; 24 25 #define DEBUG_TYPE "pattern-matcher" 26 27 /// The max number of iterations scanning for pattern match. 28 static unsigned maxPatternMatchIterations = 10; 29 30 //===----------------------------------------------------------------------===// 31 // GreedyPatternRewriteDriver 32 //===----------------------------------------------------------------------===// 33 34 namespace { 35 /// This is a worklist-driven driver for the PatternMatcher, which repeatedly 36 /// applies the locally optimal patterns in a roughly "bottom up" way. 37 class GreedyPatternRewriteDriver : public PatternRewriter { 38 public: 39 explicit GreedyPatternRewriteDriver(MLIRContext *ctx, 40 const FrozenRewritePatternList &patterns) 41 : PatternRewriter(ctx), matcher(patterns), folder(ctx) { 42 worklist.reserve(64); 43 44 // Apply a simple cost model based solely on pattern benefit. 45 matcher.applyDefaultCostModel(); 46 } 47 48 bool simplify(MutableArrayRef<Region> regions, int maxIterations); 49 50 void addToWorklist(Operation *op) { 51 // Check to see if the worklist already contains this op. 52 if (worklistMap.count(op)) 53 return; 54 55 worklistMap[op] = worklist.size(); 56 worklist.push_back(op); 57 } 58 59 Operation *popFromWorklist() { 60 auto *op = worklist.back(); 61 worklist.pop_back(); 62 63 // This operation is no longer in the worklist, keep worklistMap up to date. 64 if (op) 65 worklistMap.erase(op); 66 return op; 67 } 68 69 /// If the specified operation is in the worklist, remove it. If not, this is 70 /// a no-op. 71 void removeFromWorklist(Operation *op) { 72 auto it = worklistMap.find(op); 73 if (it != worklistMap.end()) { 74 assert(worklist[it->second] == op && "malformed worklist data structure"); 75 worklist[it->second] = nullptr; 76 worklistMap.erase(it); 77 } 78 } 79 80 // These are hooks implemented for PatternRewriter. 81 protected: 82 // Implement the hook for inserting operations, and make sure that newly 83 // inserted ops are added to the worklist for processing. 84 void notifyOperationInserted(Operation *op) override { addToWorklist(op); } 85 86 // If an operation is about to be removed, make sure it is not in our 87 // worklist anymore because we'd get dangling references to it. 88 void notifyOperationRemoved(Operation *op) override { 89 addToWorklist(op->getOperands()); 90 op->walk([this](Operation *operation) { 91 removeFromWorklist(operation); 92 folder.notifyRemoval(operation); 93 }); 94 } 95 96 // When the root of a pattern is about to be replaced, it can trigger 97 // simplifications to its users - make sure to add them to the worklist 98 // before the root is changed. 99 void notifyRootReplaced(Operation *op) override { 100 for (auto result : op->getResults()) 101 for (auto *user : result.getUsers()) 102 addToWorklist(user); 103 } 104 105 private: 106 // Look over the provided operands for any defining operations that should 107 // be re-added to the worklist. This function should be called when an 108 // operation is modified or removed, as it may trigger further 109 // simplifications. 110 template <typename Operands> 111 void addToWorklist(Operands &&operands) { 112 for (Value operand : operands) { 113 // If the use count of this operand is now < 2, we re-add the defining 114 // operation to the worklist. 115 // TODO: This is based on the fact that zero use operations 116 // may be deleted, and that single use values often have more 117 // canonicalization opportunities. 118 if (!operand.use_empty() && !operand.hasOneUse()) 119 continue; 120 if (auto *defInst = operand.getDefiningOp()) 121 addToWorklist(defInst); 122 } 123 } 124 125 /// The low-level pattern applicator. 126 PatternApplicator matcher; 127 128 /// The worklist for this transformation keeps track of the operations that 129 /// need to be revisited, plus their index in the worklist. This allows us to 130 /// efficiently remove operations from the worklist when they are erased, even 131 /// if they aren't the root of a pattern. 132 std::vector<Operation *> worklist; 133 DenseMap<Operation *, unsigned> worklistMap; 134 135 /// Non-pattern based folder for operations. 136 OperationFolder folder; 137 }; 138 } // end anonymous namespace 139 140 /// Performs the rewrites while folding and erasing any dead ops. Returns true 141 /// if the rewrite converges in `maxIterations`. 142 bool GreedyPatternRewriteDriver::simplify(MutableArrayRef<Region> regions, 143 int maxIterations) { 144 // Perform a prepass over the IR to discover constants. 145 for (auto ®ion : regions) 146 folder.processExistingConstants(region); 147 148 bool changed = false; 149 int iteration = 0; 150 do { 151 assert(worklist.empty() && 152 "Each iteration should start with empty worklist"); 153 154 // Add all nested operations to the worklist in preorder. 155 for (auto ®ion : regions) 156 region.walk<WalkOrder::PreOrder>( 157 [this](Operation *op) { worklist.push_back(op); }); 158 159 // Reverse the list so our pop-back loop processes them in-order. 160 std::reverse(worklist.begin(), worklist.end()); 161 // Remember the reverse index. 162 for (unsigned i = 0, e = worklist.size(); i != e; ++i) 163 worklistMap[worklist[i]] = i; 164 165 // These are scratch vectors used in the folding loop below. 166 SmallVector<Value, 8> originalOperands, resultValues; 167 168 changed = false; 169 while (!worklist.empty()) { 170 auto *op = popFromWorklist(); 171 172 // Nulls get added to the worklist when operations are removed, ignore 173 // them. 174 if (op == nullptr) 175 continue; 176 177 // If the operation is trivially dead - remove it. 178 if (isOpTriviallyDead(op)) { 179 notifyOperationRemoved(op); 180 op->erase(); 181 changed = true; 182 continue; 183 } 184 185 // Collects all the operands and result uses of the given `op` into work 186 // list. Also remove `op` and nested ops from worklist. 187 originalOperands.assign(op->operand_begin(), op->operand_end()); 188 auto preReplaceAction = [&](Operation *op) { 189 // Add the operands to the worklist for visitation. 190 addToWorklist(originalOperands); 191 192 // Add all the users of the result to the worklist so we make sure 193 // to revisit them. 194 for (auto result : op->getResults()) 195 for (auto *userOp : result.getUsers()) 196 addToWorklist(userOp); 197 198 notifyOperationRemoved(op); 199 }; 200 201 // Add the given operation to the worklist. 202 auto collectOps = [this](Operation *op) { addToWorklist(op); }; 203 204 // Try to fold this op. 205 bool inPlaceUpdate; 206 if ((succeeded(folder.tryToFold(op, collectOps, preReplaceAction, 207 &inPlaceUpdate)))) { 208 changed = true; 209 if (!inPlaceUpdate) 210 continue; 211 } 212 213 // Try to match one of the patterns. The rewriter is automatically 214 // notified of any necessary changes, so there is nothing else to do here. 215 changed |= succeeded(matcher.matchAndRewrite(op, *this)); 216 } 217 218 // After applying patterns, make sure that the CFG of each of the regions is 219 // kept up to date. 220 if (succeeded(simplifyRegions(regions))) { 221 folder.clear(); 222 changed = true; 223 } 224 } while (changed && ++iteration < maxIterations); 225 // Whether the rewrite converges, i.e. wasn't changed in the last iteration. 226 return !changed; 227 } 228 229 /// Rewrite the regions of the specified operation, which must be isolated from 230 /// above, by repeatedly applying the highest benefit patterns in a greedy 231 /// work-list driven manner. Return success if no more patterns can be matched 232 /// in the result operation regions. Note: This does not apply patterns to the 233 /// top-level operation itself. 234 /// 235 LogicalResult 236 mlir::applyPatternsAndFoldGreedily(Operation *op, 237 const FrozenRewritePatternList &patterns) { 238 return applyPatternsAndFoldGreedily(op, patterns, maxPatternMatchIterations); 239 } 240 LogicalResult 241 mlir::applyPatternsAndFoldGreedily(Operation *op, 242 const FrozenRewritePatternList &patterns, 243 unsigned maxIterations) { 244 return applyPatternsAndFoldGreedily(op->getRegions(), patterns, 245 maxIterations); 246 } 247 /// Rewrite the given regions, which must be isolated from above. 248 LogicalResult 249 mlir::applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions, 250 const FrozenRewritePatternList &patterns) { 251 return applyPatternsAndFoldGreedily(regions, patterns, 252 maxPatternMatchIterations); 253 } 254 LogicalResult 255 mlir::applyPatternsAndFoldGreedily(MutableArrayRef<Region> regions, 256 const FrozenRewritePatternList &patterns, 257 unsigned maxIterations) { 258 if (regions.empty()) 259 return success(); 260 261 // The top-level operation must be known to be isolated from above to 262 // prevent performing canonicalizations on operations defined at or above 263 // the region containing 'op'. 264 auto regionIsIsolated = [](Region ®ion) { 265 return region.getParentOp()->hasTrait<OpTrait::IsIsolatedFromAbove>(); 266 }; 267 (void)regionIsIsolated; 268 assert(llvm::all_of(regions, regionIsIsolated) && 269 "patterns can only be applied to operations IsolatedFromAbove"); 270 271 // Start the pattern driver. 272 GreedyPatternRewriteDriver driver(regions[0].getContext(), patterns); 273 bool converged = driver.simplify(regions, maxIterations); 274 LLVM_DEBUG(if (!converged) { 275 llvm::dbgs() << "The pattern rewrite doesn't converge after scanning " 276 << maxIterations << " times\n"; 277 }); 278 return success(converged); 279 } 280 281 //===----------------------------------------------------------------------===// 282 // OpPatternRewriteDriver 283 //===----------------------------------------------------------------------===// 284 285 namespace { 286 /// This is a simple driver for the PatternMatcher to apply patterns and perform 287 /// folding on a single op. It repeatedly applies locally optimal patterns. 288 class OpPatternRewriteDriver : public PatternRewriter { 289 public: 290 explicit OpPatternRewriteDriver(MLIRContext *ctx, 291 const FrozenRewritePatternList &patterns) 292 : PatternRewriter(ctx), matcher(patterns), folder(ctx) { 293 // Apply a simple cost model based solely on pattern benefit. 294 matcher.applyDefaultCostModel(); 295 } 296 297 /// Performs the rewrites and folding only on `op`. The simplification 298 /// converges if the op is erased as a result of being folded, replaced, or 299 /// dead, or no more changes happen in an iteration. Returns success if the 300 /// rewrite converges in `maxIterations`. `erased` is set to true if `op` gets 301 /// erased. 302 LogicalResult simplifyLocally(Operation *op, int maxIterations, bool &erased); 303 304 // These are hooks implemented for PatternRewriter. 305 protected: 306 /// If an operation is about to be removed, mark it so that we can let clients 307 /// know. 308 void notifyOperationRemoved(Operation *op) override { 309 opErasedViaPatternRewrites = true; 310 } 311 312 // When a root is going to be replaced, its removal will be notified as well. 313 // So there is nothing to do here. 314 void notifyRootReplaced(Operation *op) override {} 315 316 private: 317 /// The low-level pattern applicator. 318 PatternApplicator matcher; 319 320 /// Non-pattern based folder for operations. 321 OperationFolder folder; 322 323 /// Set to true if the operation has been erased via pattern rewrites. 324 bool opErasedViaPatternRewrites = false; 325 }; 326 327 } // anonymous namespace 328 329 LogicalResult OpPatternRewriteDriver::simplifyLocally(Operation *op, 330 int maxIterations, 331 bool &erased) { 332 bool changed = false; 333 erased = false; 334 opErasedViaPatternRewrites = false; 335 int i = 0; 336 // Iterate until convergence or until maxIterations. Deletion of the op as 337 // a result of being dead or folded is convergence. 338 do { 339 changed = false; 340 341 // If the operation is trivially dead - remove it. 342 if (isOpTriviallyDead(op)) { 343 op->erase(); 344 erased = true; 345 return success(); 346 } 347 348 // Try to fold this op. 349 bool inPlaceUpdate; 350 if (succeeded(folder.tryToFold(op, /*processGeneratedConstants=*/nullptr, 351 /*preReplaceAction=*/nullptr, 352 &inPlaceUpdate))) { 353 changed = true; 354 if (!inPlaceUpdate) { 355 erased = true; 356 return success(); 357 } 358 } 359 360 // Try to match one of the patterns. The rewriter is automatically 361 // notified of any necessary changes, so there is nothing else to do here. 362 changed |= succeeded(matcher.matchAndRewrite(op, *this)); 363 if ((erased = opErasedViaPatternRewrites)) 364 return success(); 365 } while (changed && ++i < maxIterations); 366 367 // Whether the rewrite converges, i.e. wasn't changed in the last iteration. 368 return failure(changed); 369 } 370 371 /// Rewrites only `op` using the supplied canonicalization patterns and 372 /// folding. `erased` is set to true if the op is erased as a result of being 373 /// folded, replaced, or dead. 374 LogicalResult mlir::applyOpPatternsAndFold( 375 Operation *op, const FrozenRewritePatternList &patterns, bool *erased) { 376 // Start the pattern driver. 377 OpPatternRewriteDriver driver(op->getContext(), patterns); 378 bool opErased; 379 LogicalResult converged = 380 driver.simplifyLocally(op, maxPatternMatchIterations, opErased); 381 if (erased) 382 *erased = opErased; 383 LLVM_DEBUG(if (failed(converged)) { 384 llvm::dbgs() << "The pattern rewrite doesn't converge after scanning " 385 << maxPatternMatchIterations << " times"; 386 }); 387 return converged; 388 } 389