//===- ShapeToStandard.cpp - conversion from Shape to Standard dialect ----===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "mlir/Conversion/ShapeToStandard/ShapeToStandard.h" #include "../PassDetail.h" #include "mlir/Dialect/Arithmetic/IR/Arithmetic.h" #include "mlir/Dialect/SCF/SCF.h" #include "mlir/Dialect/Shape/IR/Shape.h" #include "mlir/Dialect/StandardOps/IR/Ops.h" #include "mlir/Dialect/Tensor/IR/Tensor.h" #include "mlir/IR/BlockAndValueMapping.h" #include "mlir/IR/ImplicitLocOpBuilder.h" #include "mlir/Transforms/DialectConversion.h" #include "llvm/ADT/STLExtras.h" using namespace mlir; using namespace mlir::shape; using namespace mlir::scf; /// Conversion patterns. namespace { class AnyOpConversion : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(AnyOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult AnyOpConversion::matchAndRewrite(AnyOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // Replace `any` with its first operand. // Any operand would be a valid substitution. rewriter.replaceOp(op, {adaptor.getInputs().front()}); return success(); } namespace { template class BinaryOpConversion : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(SrcOpTy op, typename SrcOpTy::Adaptor adaptor, ConversionPatternRewriter &rewriter) const override { // For now, only error-free types are supported by this lowering. if (op.getType().template isa()) return failure(); rewriter.replaceOpWithNewOp(op, adaptor.getLhs(), adaptor.getRhs()); return success(); } }; } // namespace namespace { struct BroadcastOpConverter : public OpConversionPattern { using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(BroadcastOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; // Get the resulting extent in a given dimension. This is computed with any // number of extent tensors and shifted offsets into them. Value getBroadcastedDim(ImplicitLocOpBuilder lb, ValueRange extentTensors, ValueRange rankDiffs, Value outputDimension) { Value one = lb.create(1); Value broadcastedDim = one; for (auto tup : llvm::zip(extentTensors, rankDiffs)) { Value shape = std::get<0>(tup); Value rankDiff = std::get<1>(tup); Value outOfBounds = lb.create(arith::CmpIPredicate::ult, outputDimension, rankDiff); Type indexTy = lb.getIndexType(); broadcastedDim = lb.create( TypeRange{indexTy}, outOfBounds, [&](OpBuilder &b, Location loc) { b.create(loc, broadcastedDim); }, [&](OpBuilder &b, Location loc) { // The broadcasting logic is: // - if one extent (here we arbitrarily choose the // extent from the greater-rank operand) is equal to 1, // then take the extent from the other operand // - otherwise, take the extent as-is. // Note that this logic remains correct in the presence // of dimensions of zero extent. Value lesserRankOperandDimension = b.create( loc, indexTy, outputDimension, rankDiff); Value lesserRankOperandExtent = b.create( loc, shape, ValueRange{lesserRankOperandDimension}); Value dimIsOne = b.create(loc, arith::CmpIPredicate::eq, lesserRankOperandExtent, one); Value dim = b.create(loc, dimIsOne, broadcastedDim, lesserRankOperandExtent); b.create(loc, dim); }) .getResult(0); } return broadcastedDim; } } // namespace LogicalResult BroadcastOpConverter::matchAndRewrite( BroadcastOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, this lowering is only defined on `tensor` operands, not // on shapes. if (op.getType().isa()) return failure(); auto loc = op.getLoc(); ImplicitLocOpBuilder lb(loc, rewriter); Value zero = lb.create(0); Type indexTy = lb.getIndexType(); // Save all the ranks for bounds checking. Because this is a tensor // representing the shape extents, the rank is the extent of the only // dimension in the tensor. SmallVector ranks, rankDiffs; llvm::append_range(ranks, llvm::map_range(adaptor.getShapes(), [&](Value v) { return lb.create(v, zero); })); // Find the maximum rank Value maxRank = ranks.front(); for (Value v : llvm::drop_begin(ranks, 1)) { Value rankIsGreater = lb.create(arith::CmpIPredicate::ugt, v, maxRank); maxRank = lb.create(rankIsGreater, v, maxRank); } // Calculate the difference of ranks and the maximum rank for later offsets. llvm::append_range(rankDiffs, llvm::map_range(ranks, [&](Value v) { return lb.create(indexTy, maxRank, v); })); Value replacement = lb.create( getExtentTensorType(lb.getContext()), ValueRange{maxRank}, [&](OpBuilder &b, Location loc, ValueRange args) { Value broadcastedDim = getBroadcastedDim(ImplicitLocOpBuilder(loc, b), adaptor.getShapes(), rankDiffs, args[0]); b.create(loc, broadcastedDim); }); if (replacement.getType() != op.getType()) replacement = lb.create(op.getType(), replacement); rewriter.replaceOp(op, replacement); return success(); } namespace { class ConstShapeOpConverter : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(ConstShapeOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult ConstShapeOpConverter::matchAndRewrite( ConstShapeOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, this lowering supports only extent tensors, not `shape.shape` // types. if (op.getType().isa()) return failure(); auto loc = op.getLoc(); SmallVector extentOperands; for (auto extent : op.getShape()) { extentOperands.push_back( rewriter.create(loc, extent.getLimitedValue())); } Type resultTy = RankedTensorType::get({op.getShape().size()}, rewriter.getIndexType()); Value tensor = rewriter.create(loc, resultTy, extentOperands); rewriter.replaceOpWithNewOp(op, resultTy, tensor); return success(); } namespace { class ConstSizeOpConversion : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(ConstSizeOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult ConstSizeOpConversion::matchAndRewrite( ConstSizeOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { rewriter.replaceOpWithNewOp( op, op.getValue().getSExtValue()); return success(); } namespace { struct IsBroadcastableOpConverter : public OpConversionPattern { using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(IsBroadcastableOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult IsBroadcastableOpConverter::matchAndRewrite( IsBroadcastableOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, this lowering is only defined on `tensor` operands, not // on shapes. if (!llvm::all_of(op.getShapes(), [](Value v) { return !v.getType().isa(); })) return failure(); auto loc = op.getLoc(); ImplicitLocOpBuilder lb(loc, rewriter); Value zero = lb.create(0); Value one = lb.create(1); Type indexTy = lb.getIndexType(); // Save all the ranks for bounds checking. Because this is a tensor // representing the shape extents, the rank is the extent of the only // dimension in the tensor. SmallVector ranks, rankDiffs; llvm::append_range(ranks, llvm::map_range(adaptor.getShapes(), [&](Value v) { return lb.create(v, zero); })); // Find the maximum rank Value maxRank = ranks.front(); for (Value v : llvm::drop_begin(ranks, 1)) { Value rankIsGreater = lb.create(arith::CmpIPredicate::ugt, v, maxRank); maxRank = lb.create(rankIsGreater, v, maxRank); } // Calculate the difference of ranks and the maximum rank for later offsets. llvm::append_range(rankDiffs, llvm::map_range(ranks, [&](Value v) { return lb.create(indexTy, maxRank, v); })); Type i1Ty = rewriter.getI1Type(); Value trueVal = rewriter.create(loc, i1Ty, rewriter.getBoolAttr(true)); auto reduceResult = lb.create( loc, zero, maxRank, one, ValueRange{trueVal}, [&](OpBuilder &b, Location loc, Value iv, ValueRange iterArgs) { // Find a non-1 dim, if it exists. Note that the first part of this // could reuse the Broadcast lowering entirely, but we redo the work // here to make optimizations easier between the two loops. Value broadcastedDim = getBroadcastedDim( ImplicitLocOpBuilder(loc, b), adaptor.getShapes(), rankDiffs, iv); Value broadcastable = iterArgs[0]; for (auto tup : llvm::zip(adaptor.getShapes(), rankDiffs)) { Value shape, rankDiff; std::tie(shape, rankDiff) = tup; Value outOfBounds = b.create( loc, arith::CmpIPredicate::ult, iv, rankDiff); broadcastable = b.create( loc, TypeRange{i1Ty}, outOfBounds, [&](OpBuilder &b, Location loc) { // Non existent dimensions are always broadcastable b.create(loc, broadcastable); }, [&](OpBuilder &b, Location loc) { // Every value needs to be either 1, or the same non-1 // value to be broadcastable in this dim. Value operandDimension = b.create(loc, indexTy, iv, rankDiff); Value dimensionExtent = b.create( loc, shape, ValueRange{operandDimension}); Value equalOne = b.create( loc, arith::CmpIPredicate::eq, dimensionExtent, one); Value equalBroadcasted = b.create( loc, arith::CmpIPredicate::eq, dimensionExtent, broadcastedDim); Value result = b.create( loc, broadcastable, b.create(loc, equalOne, equalBroadcasted)); b.create(loc, result); }) .getResult(0); } b.create(loc, broadcastable); }); rewriter.replaceOp(op, reduceResult.getResults().front()); return success(); } namespace { class GetExtentOpConverter : public OpConversionPattern { using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(GetExtentOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult GetExtentOpConverter::matchAndRewrite( GetExtentOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, only error-free types are supported by this lowering. if (op.getType().isa()) return failure(); // Derive shape extent directly from shape origin if possible. This // circumvents the necessity to materialize the shape in memory. if (auto shapeOfOp = op.getShape().getDefiningOp()) { if (shapeOfOp.getArg().getType().isa()) { rewriter.replaceOpWithNewOp(op, shapeOfOp.getArg(), adaptor.getDim()); return success(); } } rewriter.replaceOpWithNewOp(op, rewriter.getIndexType(), adaptor.getShape(), ValueRange{adaptor.getDim()}); return success(); } namespace { class RankOpConverter : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(shape::RankOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult RankOpConverter::matchAndRewrite(shape::RankOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, this lowering supports only error-free types. if (op.getType().isa()) return failure(); rewriter.replaceOpWithNewOp(op, adaptor.getShape(), 0); return success(); } namespace { /// Converts `shape.reduce` to `scf.for`. struct ReduceOpConverter : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(shape::ReduceOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const final; }; } // namespace LogicalResult ReduceOpConverter::matchAndRewrite(shape::ReduceOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, this lowering is only defined on `tensor` operands. if (op.getShape().getType().isa()) return failure(); auto loc = op.getLoc(); Value zero = rewriter.create(loc, 0); Value one = rewriter.create(loc, 1); Type indexTy = rewriter.getIndexType(); Value rank = rewriter.create(loc, indexTy, adaptor.getShape(), zero); auto loop = rewriter.create( loc, zero, rank, one, op.getInitVals(), [&](OpBuilder &b, Location loc, Value iv, ValueRange args) { Value extent = b.create(loc, adaptor.getShape(), iv); SmallVector mappedValues{iv, extent}; mappedValues.append(args.begin(), args.end()); BlockAndValueMapping mapping; Block *reduceBody = op.getBody(); mapping.map(reduceBody->getArguments(), mappedValues); for (auto &nested : reduceBody->without_terminator()) b.clone(nested, mapping); SmallVector mappedResults; for (auto result : reduceBody->getTerminator()->getOperands()) mappedResults.push_back(mapping.lookup(result)); b.create(loc, mappedResults); }); rewriter.replaceOp(op, loop.getResults()); return success(); } namespace { /// Converts `shape.shape_eq` to an `scf.for` loop. For now, the lowering is /// only defined on `tensor` operands. The test for equality first /// compares their size and, if equal, checks every extent for equality. /// /// Example: /// /// %result = shape.shape_eq %a, %b : tensor, tensor /// /// becomes /// /// %c0 = arith.constant 0 : index /// %0 = dim %arg0, %c0 : tensor /// %1 = dim %arg1, %c0 : tensor /// %2 = arith.cmpi "eq", %0, %1 : index /// %result = scf.if %2 -> (i1) { /// %c1 = arith.constant 1 : index /// %true = arith.constant true /// %4 = scf.for %arg2 = %c0 to %0 step %c1 iter_args(%arg3 = %true) -> (i1) { /// %5 = tensor.extract %arg0[%arg2] : tensor /// %6 = tensor.extract %arg1[%arg2] : tensor /// %7 = arith.cmpi "eq", %5, %6 : index /// %8 = arith.andi %arg3, %7 : i1 /// scf.yield %8 : i1 /// } /// scf.yield %4 : i1 /// } else { /// %false = arith.constant false /// scf.yield %false : i1 /// } /// struct ShapeEqOpConverter : public OpConversionPattern { using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(ShapeEqOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult ShapeEqOpConverter::matchAndRewrite(ShapeEqOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { if (!llvm::all_of(op.getShapes(), [](Value v) { return !v.getType().isa(); })) return failure(); Type i1Ty = rewriter.getI1Type(); if (op.getShapes().size() <= 1) { rewriter.replaceOpWithNewOp(op, i1Ty, rewriter.getBoolAttr(true)); return success(); } auto loc = op.getLoc(); Type indexTy = rewriter.getIndexType(); Value zero = rewriter.create(loc, 0); Value firstShape = adaptor.getShapes().front(); Value firstRank = rewriter.create(loc, indexTy, firstShape, zero); Value result = nullptr; // Generate a linear sequence of compares, all with firstShape as lhs. for (Value shape : adaptor.getShapes().drop_front(1)) { Value rank = rewriter.create(loc, indexTy, shape, zero); Value eqRank = rewriter.create(loc, arith::CmpIPredicate::eq, firstRank, rank); auto same = rewriter.create( loc, i1Ty, eqRank, [&](OpBuilder &b, Location loc) { Value one = b.create(loc, 1); Value init = b.create(loc, i1Ty, b.getBoolAttr(true)); auto loop = b.create( loc, zero, firstRank, one, ValueRange{init}, [&](OpBuilder &b, Location nestedLoc, Value iv, ValueRange args) { Value conj = args[0]; Value lhsExtent = b.create(loc, firstShape, iv); Value rhsExtent = b.create(loc, shape, iv); Value eqExtent = b.create( loc, arith::CmpIPredicate::eq, lhsExtent, rhsExtent); Value conjNext = b.create(loc, conj, eqExtent); b.create(loc, ValueRange({conjNext})); }); b.create(loc, loop.getResults()); }, [&](OpBuilder &b, Location loc) { Value result = b.create(loc, i1Ty, b.getBoolAttr(false)); b.create(loc, result); }); result = !result ? same.getResult(0) : rewriter.create(loc, result, same.getResult(0)); } rewriter.replaceOp(op, result); return success(); } namespace { class ShapeOfOpConversion : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(ShapeOfOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult ShapeOfOpConversion::matchAndRewrite( ShapeOfOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // For now, only error-free types are supported by this lowering. if (op.getType().isa()) return failure(); // For ranked tensor arguments, lower to `tensor.from_elements`. auto loc = op.getLoc(); Value tensor = adaptor.getArg(); Type tensorTy = tensor.getType(); if (tensorTy.isa()) { // Build values for individual extents. SmallVector extentValues; RankedTensorType rankedTensorTy = tensorTy.cast(); int64_t rank = rankedTensorTy.getRank(); for (int64_t i = 0; i < rank; i++) { if (rankedTensorTy.isDynamicDim(i)) { Value extent = rewriter.create(loc, tensor, i); extentValues.push_back(extent); } else { Value extent = rewriter.create( loc, rankedTensorTy.getDimSize(i)); extentValues.push_back(extent); } } // Materialize extent tensor. Value staticExtentTensor = rewriter.create( loc, RankedTensorType::get({rank}, rewriter.getIndexType()), extentValues); rewriter.replaceOpWithNewOp(op, op.getType(), staticExtentTensor); return success(); } // Lower to `tensor.generate` otherwise. auto *ctx = rewriter.getContext(); Value rank = rewriter.create(loc, tensor); rewriter.replaceOpWithNewOp( op, getExtentTensorType(ctx), ValueRange{rank}, [&](OpBuilder &b, Location loc, ValueRange args) { Value dim = args.front(); Value extent = b.create(loc, tensor, dim); b.create(loc, extent); }); return success(); } namespace { class SplitAtOpConversion : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(SplitAtOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override; }; } // namespace LogicalResult SplitAtOpConversion::matchAndRewrite( SplitAtOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const { // Error conditions are not implemented, only lower if all operands and // results are extent tensors. if (llvm::any_of(ValueRange{op.getOperand(), op.getHead(), op.getTail()}, [](Value v) { return v.getType().isa(); })) return failure(); ImplicitLocOpBuilder b(op.getLoc(), rewriter); Value zero = b.create(0); Value rank = b.create(adaptor.getOperand(), zero); // index < 0 ? index + rank : index Value originalIndex = adaptor.getIndex(); Value add = b.create(originalIndex, rank); Value indexIsNegative = b.create(arith::CmpIPredicate::slt, originalIndex, zero); Value index = b.create(indexIsNegative, add, originalIndex); Value one = b.create(1); Value head = b.create(adaptor.getOperand(), zero, index, one); Value tailSize = b.create(rank, index); Value tail = b.create(adaptor.getOperand(), index, tailSize, one); rewriter.replaceOp(op, {head, tail}); return success(); } namespace { class ToExtentTensorOpConversion : public OpConversionPattern { public: using OpConversionPattern::OpConversionPattern; LogicalResult matchAndRewrite(ToExtentTensorOp op, OpAdaptor adaptor, ConversionPatternRewriter &rewriter) const override { if (!adaptor.getInput().getType().isa()) return rewriter.notifyMatchFailure(op, "input needs to be a tensor"); rewriter.replaceOpWithNewOp(op, op.getType(), adaptor.getInput()); return success(); } }; } // namespace namespace { /// Import the Shape Ops to Std Patterns. #include "ShapeToStandard.cpp.inc" } // namespace namespace { /// Conversion pass. class ConvertShapeToStandardPass : public ConvertShapeToStandardBase { void runOnOperation() override; }; } // namespace void ConvertShapeToStandardPass::runOnOperation() { // Setup target legality. MLIRContext &ctx = getContext(); ConversionTarget target(ctx); target.addLegalDialect(); target.addLegalOp(); // Setup conversion patterns. RewritePatternSet patterns(&ctx); populateShapeToStandardConversionPatterns(patterns); // Apply conversion. auto module = getOperation(); if (failed(applyPartialConversion(module, target, std::move(patterns)))) signalPassFailure(); } void mlir::populateShapeToStandardConversionPatterns( RewritePatternSet &patterns) { // clang-format off populateWithGenerated(patterns); patterns.add< AnyOpConversion, BinaryOpConversion, BinaryOpConversion, BroadcastOpConverter, ConstShapeOpConverter, ConstSizeOpConversion, IsBroadcastableOpConverter, GetExtentOpConverter, RankOpConverter, ReduceOpConverter, ShapeEqOpConverter, ShapeOfOpConversion, SplitAtOpConversion, ToExtentTensorOpConversion>(patterns.getContext()); // clang-format on } std::unique_ptr> mlir::createConvertShapeToStandardPass() { return std::make_unique(); }