1b8737614SUday Bondhugula //===- LoopUnroll.cpp - Code to perform loop unrolling --------------------===//
2b8737614SUday Bondhugula //
3b8737614SUday Bondhugula // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4b8737614SUday Bondhugula // See https://llvm.org/LICENSE.txt for license information.
5b8737614SUday Bondhugula // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6b8737614SUday Bondhugula //
7b8737614SUday Bondhugula //===----------------------------------------------------------------------===//
8b8737614SUday Bondhugula //
9b8737614SUday Bondhugula // This file implements loop unrolling.
10b8737614SUday Bondhugula //
11b8737614SUday Bondhugula //===----------------------------------------------------------------------===//
121834ad4aSRiver Riddle #include "PassDetail.h"
13755dc07dSRiver Riddle #include "mlir/Dialect/Affine/Analysis/LoopAnalysis.h"
14b8737614SUday Bondhugula #include "mlir/Dialect/Affine/IR/AffineOps.h"
15a70aa7bbSRiver Riddle #include "mlir/Dialect/Affine/LoopUtils.h"
16b8737614SUday Bondhugula #include "mlir/Dialect/Affine/Passes.h"
17b8737614SUday Bondhugula #include "mlir/IR/AffineExpr.h"
18b8737614SUday Bondhugula #include "mlir/IR/AffineMap.h"
19b8737614SUday Bondhugula #include "mlir/IR/Builders.h"
20b8737614SUday Bondhugula #include "llvm/ADT/DenseMap.h"
21b8737614SUday Bondhugula #include "llvm/Support/CommandLine.h"
22b8737614SUday Bondhugula #include "llvm/Support/Debug.h"
23b8737614SUday Bondhugula
24b8737614SUday Bondhugula using namespace mlir;
25b8737614SUday Bondhugula
26b8737614SUday Bondhugula #define DEBUG_TYPE "affine-loop-unroll"
27b8737614SUday Bondhugula
28b8737614SUday Bondhugula namespace {
29e1fb9d53SUday Bondhugula
30e1fb9d53SUday Bondhugula // TODO: this is really a test pass and should be moved out of dialect
31e1fb9d53SUday Bondhugula // transforms.
32e1fb9d53SUday Bondhugula
33b8737614SUday Bondhugula /// Loop unrolling pass. Unrolls all innermost loops unless full unrolling and a
34b8737614SUday Bondhugula /// full unroll threshold was specified, in which case, fully unrolls all loops
35b8737614SUday Bondhugula /// with trip count less than the specified threshold. The latter is for testing
36b8737614SUday Bondhugula /// purposes, especially for testing outer loop unrolling.
371834ad4aSRiver Riddle struct LoopUnroll : public AffineLoopUnrollBase<LoopUnroll> {
38b8737614SUday Bondhugula // Callback to obtain unroll factors; if this has a callable target, takes
39b8737614SUday Bondhugula // precedence over command-line argument or passed argument.
40b8737614SUday Bondhugula const std::function<unsigned(AffineForOp)> getUnrollFactor;
41b8737614SUday Bondhugula
LoopUnroll__anon71bca16a0111::LoopUnroll42400ad6f9SRiver Riddle LoopUnroll() : getUnrollFactor(nullptr) {}
43400ad6f9SRiver Riddle LoopUnroll(const LoopUnroll &other)
44e5639b3fSMehdi Amini
45e5639b3fSMehdi Amini = default;
LoopUnroll__anon71bca16a0111::LoopUnroll46b8737614SUday Bondhugula explicit LoopUnroll(
47e2394245SLubomir Litchev Optional<unsigned> unrollFactor = None, bool unrollUpToFactor = false,
48e2394245SLubomir Litchev bool unrollFull = false,
49b8737614SUday Bondhugula const std::function<unsigned(AffineForOp)> &getUnrollFactor = nullptr)
50400ad6f9SRiver Riddle : getUnrollFactor(getUnrollFactor) {
51400ad6f9SRiver Riddle if (unrollFactor)
52400ad6f9SRiver Riddle this->unrollFactor = *unrollFactor;
53e2394245SLubomir Litchev this->unrollUpToFactor = unrollUpToFactor;
54400ad6f9SRiver Riddle this->unrollFull = unrollFull;
55400ad6f9SRiver Riddle }
56b8737614SUday Bondhugula
5741574554SRiver Riddle void runOnOperation() override;
58b8737614SUday Bondhugula
59b8737614SUday Bondhugula /// Unroll this for op. Returns failure if nothing was done.
60b8737614SUday Bondhugula LogicalResult runOnAffineForOp(AffineForOp forOp);
61b8737614SUday Bondhugula };
62be0a7e9fSMehdi Amini } // namespace
63b8737614SUday Bondhugula
64da93537bSUday Bondhugula /// Returns true if no other affine.for ops are nested within `op`.
isInnermostAffineForOp(AffineForOp op)65da93537bSUday Bondhugula static bool isInnermostAffineForOp(AffineForOp op) {
66da93537bSUday Bondhugula return !op.getBody()
67da93537bSUday Bondhugula ->walk([&](AffineForOp nestedForOp) {
68e1fb9d53SUday Bondhugula return WalkResult::interrupt();
69da93537bSUday Bondhugula })
70da93537bSUday Bondhugula .wasInterrupted();
71e1fb9d53SUday Bondhugula }
72e1fb9d53SUday Bondhugula
73e1fb9d53SUday Bondhugula /// Gathers loops that have no affine.for's nested within.
gatherInnermostLoops(func::FuncOp f,SmallVectorImpl<AffineForOp> & loops)7458ceae95SRiver Riddle static void gatherInnermostLoops(func::FuncOp f,
75e1fb9d53SUday Bondhugula SmallVectorImpl<AffineForOp> &loops) {
76e1fb9d53SUday Bondhugula f.walk([&](AffineForOp forOp) {
77e1fb9d53SUday Bondhugula if (isInnermostAffineForOp(forOp))
78e1fb9d53SUday Bondhugula loops.push_back(forOp);
79e1fb9d53SUday Bondhugula });
80e1fb9d53SUday Bondhugula }
81e1fb9d53SUday Bondhugula
runOnOperation()8241574554SRiver Riddle void LoopUnroll::runOnOperation() {
8358ceae95SRiver Riddle func::FuncOp func = getOperation();
8441574554SRiver Riddle if (func.isExternal())
8541574554SRiver Riddle return;
8641574554SRiver Riddle
87400ad6f9SRiver Riddle if (unrollFull && unrollFullThreshold.hasValue()) {
88b8737614SUday Bondhugula // Store short loops as we walk.
89e1fb9d53SUday Bondhugula SmallVector<AffineForOp, 4> loops;
90b8737614SUday Bondhugula
91b8737614SUday Bondhugula // Gathers all loops with trip count <= minTripCount. Do a post order walk
92b8737614SUday Bondhugula // so that loops are gathered from innermost to outermost (or else unrolling
93b8737614SUday Bondhugula // an outer one may delete gathered inner ones).
9441574554SRiver Riddle getOperation().walk([&](AffineForOp forOp) {
95b8737614SUday Bondhugula Optional<uint64_t> tripCount = getConstantTripCount(forOp);
96*037f0995SKazu Hirata if (tripCount && *tripCount <= unrollFullThreshold)
97b8737614SUday Bondhugula loops.push_back(forOp);
98b8737614SUday Bondhugula });
99b8737614SUday Bondhugula for (auto forOp : loops)
100e21adfa3SRiver Riddle (void)loopUnrollFull(forOp);
101b8737614SUday Bondhugula return;
102b8737614SUday Bondhugula }
103b8737614SUday Bondhugula
104b8737614SUday Bondhugula // If the call back is provided, we will recurse until no loops are found.
105e1fb9d53SUday Bondhugula SmallVector<AffineForOp, 4> loops;
106b8737614SUday Bondhugula for (unsigned i = 0; i < numRepetitions || getUnrollFactor; i++) {
107e1fb9d53SUday Bondhugula loops.clear();
108e1fb9d53SUday Bondhugula gatherInnermostLoops(func, loops);
109b8737614SUday Bondhugula if (loops.empty())
110b8737614SUday Bondhugula break;
111b8737614SUday Bondhugula bool unrolled = false;
112b8737614SUday Bondhugula for (auto forOp : loops)
113b8737614SUday Bondhugula unrolled |= succeeded(runOnAffineForOp(forOp));
114b8737614SUday Bondhugula if (!unrolled)
115b8737614SUday Bondhugula // Break out if nothing was unrolled.
116b8737614SUday Bondhugula break;
117b8737614SUday Bondhugula }
118b8737614SUday Bondhugula }
119b8737614SUday Bondhugula
120b8737614SUday Bondhugula /// Unrolls a 'affine.for' op. Returns success if the loop was unrolled,
121b8737614SUday Bondhugula /// failure otherwise. The default unroll factor is 4.
runOnAffineForOp(AffineForOp forOp)122b8737614SUday Bondhugula LogicalResult LoopUnroll::runOnAffineForOp(AffineForOp forOp) {
123b8737614SUday Bondhugula // Use the function callback if one was provided.
124400ad6f9SRiver Riddle if (getUnrollFactor)
125b8737614SUday Bondhugula return loopUnrollByFactor(forOp, getUnrollFactor(forOp));
126b8737614SUday Bondhugula // Unroll completely if full loop unroll was specified.
127400ad6f9SRiver Riddle if (unrollFull)
128b8737614SUday Bondhugula return loopUnrollFull(forOp);
129400ad6f9SRiver Riddle // Otherwise, unroll by the given unroll factor.
13032062478SLubomir Litchev if (unrollUpToFactor)
131e2394245SLubomir Litchev return loopUnrollUpToFactor(forOp, unrollFactor);
132400ad6f9SRiver Riddle return loopUnrollByFactor(forOp, unrollFactor);
133b8737614SUday Bondhugula }
134b8737614SUday Bondhugula
createLoopUnrollPass(int unrollFactor,bool unrollUpToFactor,bool unrollFull,const std::function<unsigned (AffineForOp)> & getUnrollFactor)13558ceae95SRiver Riddle std::unique_ptr<OperationPass<func::FuncOp>> mlir::createLoopUnrollPass(
136e2394245SLubomir Litchev int unrollFactor, bool unrollUpToFactor, bool unrollFull,
137b8737614SUday Bondhugula const std::function<unsigned(AffineForOp)> &getUnrollFactor) {
138b8737614SUday Bondhugula return std::make_unique<LoopUnroll>(
139e2394245SLubomir Litchev unrollFactor == -1 ? None : Optional<unsigned>(unrollFactor),
140e2394245SLubomir Litchev unrollUpToFactor, unrollFull, getUnrollFactor);
141b8737614SUday Bondhugula }
142