//===- SCFToGPUPass.cpp - Convert a loop nest to a GPU kernel -----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
84ead2cf7SAlex Zinenko
94ead2cf7SAlex Zinenko #include "mlir/Conversion/SCFToGPU/SCFToGPUPass.h"
104ead2cf7SAlex Zinenko #include "../PassDetail.h"
114ead2cf7SAlex Zinenko #include "mlir/Conversion/SCFToGPU/SCFToGPU.h"
124ead2cf7SAlex Zinenko #include "mlir/Dialect/Affine/IR/AffineOps.h"
13a54f4eaeSMogball #include "mlir/Dialect/Arithmetic/IR/Arithmetic.h"
14b1e1bbaeSAlexander Belyaev #include "mlir/Dialect/Complex/IR/Complex.h"
15d7ef488bSMogball #include "mlir/Dialect/GPU/IR/GPUDialect.h"
16*8b68da2cSAlex Zinenko #include "mlir/Dialect/SCF/IR/SCF.h"
174ead2cf7SAlex Zinenko #include "mlir/Transforms/DialectConversion.h"
184ead2cf7SAlex Zinenko
194ead2cf7SAlex Zinenko #include "llvm/ADT/ArrayRef.h"
204ead2cf7SAlex Zinenko #include "llvm/Support/CommandLine.h"
214ead2cf7SAlex Zinenko
224ead2cf7SAlex Zinenko using namespace mlir;
234ead2cf7SAlex Zinenko using namespace mlir::scf;
244ead2cf7SAlex Zinenko
254ead2cf7SAlex Zinenko namespace {
264ead2cf7SAlex Zinenko // A pass that traverses top-level loops in the function and converts them to
274ead2cf7SAlex Zinenko // GPU launch operations. Nested launches are not allowed, so this does not
284ead2cf7SAlex Zinenko // walk the function recursively to avoid considering nested loops.
292bcd1927SMaheshRavishankar struct ForLoopMapper : public ConvertAffineForToGPUBase<ForLoopMapper> {
304ead2cf7SAlex Zinenko ForLoopMapper() = default;
ForLoopMapper__anonb2e6168a0111::ForLoopMapper314ead2cf7SAlex Zinenko ForLoopMapper(unsigned numBlockDims, unsigned numThreadDims) {
324ead2cf7SAlex Zinenko this->numBlockDims = numBlockDims;
334ead2cf7SAlex Zinenko this->numThreadDims = numThreadDims;
344ead2cf7SAlex Zinenko }
354ead2cf7SAlex Zinenko
runOnOperation__anonb2e6168a0111::ForLoopMapper3641574554SRiver Riddle void runOnOperation() override {
3747f175b0SRiver Riddle for (Operation &op :
3847f175b0SRiver Riddle llvm::make_early_inc_range(getOperation().getBody().getOps())) {
394ead2cf7SAlex Zinenko if (auto forOp = dyn_cast<AffineForOp>(&op)) {
404ead2cf7SAlex Zinenko if (failed(convertAffineLoopNestToGPULaunch(forOp, numBlockDims,
414ead2cf7SAlex Zinenko numThreadDims)))
424ead2cf7SAlex Zinenko signalPassFailure();
434ead2cf7SAlex Zinenko }
444ead2cf7SAlex Zinenko }
454ead2cf7SAlex Zinenko }
464ead2cf7SAlex Zinenko };
474ead2cf7SAlex Zinenko
484ead2cf7SAlex Zinenko struct ParallelLoopToGpuPass
494ead2cf7SAlex Zinenko : public ConvertParallelLoopToGpuBase<ParallelLoopToGpuPass> {
runOnOperation__anonb2e6168a0111::ParallelLoopToGpuPass504ead2cf7SAlex Zinenko void runOnOperation() override {
51dc4e913bSChris Lattner RewritePatternSet patterns(&getContext());
523a506b31SChris Lattner populateParallelLoopToGPUPatterns(patterns);
534ead2cf7SAlex Zinenko ConversionTarget target(getContext());
5433a58c1cSStephan Herhut target.markUnknownOpDynamicallyLegal([](Operation *) { return true; });
555da2423bSStephan Herhut configureParallelLoopToGPULegality(target);
563fffffa8SRiver Riddle if (failed(applyPartialConversion(getOperation(), target,
573fffffa8SRiver Riddle std::move(patterns))))
584ead2cf7SAlex Zinenko signalPassFailure();
59ec03bbe8SVladislav Vinogradov finalizeParallelLoopToGPUConversion(getOperation());
604ead2cf7SAlex Zinenko }
614ead2cf7SAlex Zinenko };
624ead2cf7SAlex Zinenko
634ead2cf7SAlex Zinenko } // namespace
644ead2cf7SAlex Zinenko
6547f175b0SRiver Riddle std::unique_ptr<InterfacePass<FunctionOpInterface>>
createAffineForToGPUPass(unsigned numBlockDims,unsigned numThreadDims)662bcd1927SMaheshRavishankar mlir::createAffineForToGPUPass(unsigned numBlockDims, unsigned numThreadDims) {
674ead2cf7SAlex Zinenko return std::make_unique<ForLoopMapper>(numBlockDims, numThreadDims);
684ead2cf7SAlex Zinenko }
6947f175b0SRiver Riddle std::unique_ptr<InterfacePass<FunctionOpInterface>>
createAffineForToGPUPass()7047f175b0SRiver Riddle mlir::createAffineForToGPUPass() {
714ead2cf7SAlex Zinenko return std::make_unique<ForLoopMapper>();
724ead2cf7SAlex Zinenko }
734ead2cf7SAlex Zinenko
createParallelLoopToGpuPass()744ead2cf7SAlex Zinenko std::unique_ptr<Pass> mlir::createParallelLoopToGpuPass() {
754ead2cf7SAlex Zinenko return std::make_unique<ParallelLoopToGpuPass>();
764ead2cf7SAlex Zinenko }
77