149e37000SMatthias Springer //===- BufferizableOpInterfaceImpl.cpp - Impl. of BufferizableOpInterface -===// 249e37000SMatthias Springer // 349e37000SMatthias Springer // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 449e37000SMatthias Springer // See https://llvm.org/LICENSE.txt for license information. 549e37000SMatthias Springer // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 649e37000SMatthias Springer // 749e37000SMatthias Springer //===----------------------------------------------------------------------===// 849e37000SMatthias Springer 949e37000SMatthias Springer #include "mlir/Dialect/Tensor/Transforms/BufferizableOpInterfaceImpl.h" 1049e37000SMatthias Springer #include "mlir/Dialect/Bufferization/IR/BufferizableOpInterface.h" 1149e37000SMatthias Springer #include "mlir/Dialect/MemRef/IR/MemRef.h" 12*71bbb78bSMatthias Springer #include "mlir/Dialect/SCF/SCF.h" 1349e37000SMatthias Springer #include "mlir/Dialect/Tensor/IR/Tensor.h" 1449e37000SMatthias Springer #include "mlir/IR/Dialect.h" 1549e37000SMatthias Springer #include "mlir/IR/Operation.h" 1649e37000SMatthias Springer 1749e37000SMatthias Springer using namespace mlir; 1849e37000SMatthias Springer using namespace mlir::bufferization; 1949e37000SMatthias Springer using namespace mlir::tensor; 2049e37000SMatthias Springer 2149e37000SMatthias Springer namespace mlir { 2249e37000SMatthias Springer namespace tensor { 2349e37000SMatthias Springer namespace { 2449e37000SMatthias Springer 2549e37000SMatthias Springer struct CastOpInterface 2649e37000SMatthias Springer : public BufferizableOpInterface::ExternalModel<CastOpInterface, 2749e37000SMatthias Springer tensor::CastOp> { 2849e37000SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 2949e37000SMatthias Springer const BufferizationState &state) const { 3049e37000SMatthias Springer return false; 3149e37000SMatthias Springer } 3249e37000SMatthias Springer 3349e37000SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 3449e37000SMatthias Springer const BufferizationState &state) const { 3549e37000SMatthias Springer return false; 3649e37000SMatthias Springer } 3749e37000SMatthias Springer 3849e37000SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 3949e37000SMatthias Springer const BufferizationState &state) const { 4049e37000SMatthias Springer return op->getResult(0); 4149e37000SMatthias Springer } 4249e37000SMatthias Springer 4349e37000SMatthias Springer BufferRelation bufferRelation(Operation *op, OpResult opResult, 4449e37000SMatthias Springer const BufferizationState &state) const { 4549e37000SMatthias Springer return BufferRelation::Equivalent; 4649e37000SMatthias Springer } 4749e37000SMatthias Springer 4849e37000SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 4949e37000SMatthias Springer const BufferizationState &state) const { 5049e37000SMatthias Springer auto castOp = cast<tensor::CastOp>(op); 5149e37000SMatthias Springer 5249e37000SMatthias Springer // The result buffer still has the old (pre-cast) type. 5349e37000SMatthias Springer FailureOr<Value> resultBuffer = 5449e37000SMatthias Springer state.getBuffer(rewriter, castOp->getOpOperand(0) /*source*/); 5549e37000SMatthias Springer if (failed(resultBuffer)) 5649e37000SMatthias Springer return failure(); 5749e37000SMatthias Springer auto sourceMemRefType = resultBuffer->getType().cast<BaseMemRefType>(); 5849e37000SMatthias Springer Attribute memorySpace = sourceMemRefType.getMemorySpace(); 5949e37000SMatthias Springer TensorType resultTensorType = 6049e37000SMatthias Springer castOp.getResult().getType().cast<TensorType>(); 6149e37000SMatthias Springer MemRefLayoutAttrInterface layout; 6249e37000SMatthias Springer 6349e37000SMatthias Springer if (auto rankedMemRefType = sourceMemRefType.dyn_cast<MemRefType>()) 6449e37000SMatthias Springer if (resultTensorType.isa<RankedTensorType>()) 6549e37000SMatthias Springer layout = rankedMemRefType.getLayout(); 6649e37000SMatthias Springer 6749e37000SMatthias Springer // Compute the new memref type. 6849e37000SMatthias Springer Type resultMemRefType; 6949e37000SMatthias Springer if (resultTensorType.isa<RankedTensorType>()) { 7049e37000SMatthias Springer resultMemRefType = 7149e37000SMatthias Springer getContiguousMemRefType(resultTensorType, layout, memorySpace); 7249e37000SMatthias Springer } else { 7349e37000SMatthias Springer resultMemRefType = 7449e37000SMatthias Springer getUnrankedMemRefType(resultTensorType.getElementType(), memorySpace); 7549e37000SMatthias Springer } 7649e37000SMatthias Springer 7749e37000SMatthias Springer // Replace the op with a memref.cast. 7849e37000SMatthias Springer assert(memref::CastOp::areCastCompatible(resultBuffer->getType(), 7949e37000SMatthias Springer resultMemRefType) && 8049e37000SMatthias Springer "CallOp::bufferize: cast incompatible"); 8149e37000SMatthias Springer replaceOpWithNewBufferizedOp<memref::CastOp>(rewriter, op, resultMemRefType, 8249e37000SMatthias Springer *resultBuffer); 8349e37000SMatthias Springer 8449e37000SMatthias Springer return success(); 8549e37000SMatthias Springer } 8649e37000SMatthias Springer }; 8749e37000SMatthias Springer 8849e37000SMatthias Springer /// Bufferization of tensor.dim. Replace with memref.dim. 8949e37000SMatthias Springer struct DimOpInterface 9049e37000SMatthias Springer : public BufferizableOpInterface::ExternalModel<DimOpInterface, 9149e37000SMatthias Springer tensor::DimOp> { 9249e37000SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 9349e37000SMatthias Springer const BufferizationState &state) const { 9449e37000SMatthias Springer return true; 9549e37000SMatthias Springer } 9649e37000SMatthias Springer 9749e37000SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 9849e37000SMatthias Springer const BufferizationState &state) const { 9949e37000SMatthias Springer return false; 10049e37000SMatthias Springer } 10149e37000SMatthias Springer 10249e37000SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 10349e37000SMatthias Springer const BufferizationState &state) const { 10449e37000SMatthias Springer return OpResult(); 10549e37000SMatthias Springer } 10649e37000SMatthias Springer 10749e37000SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 10849e37000SMatthias Springer const BufferizationState &state) const { 10949e37000SMatthias Springer auto dimOp = cast<tensor::DimOp>(op); 11049e37000SMatthias Springer Value v = *state.getBuffer(rewriter, dimOp->getOpOperand(0) /*source*/); 11149e37000SMatthias Springer replaceOpWithNewBufferizedOp<memref::DimOp>(rewriter, op, v, dimOp.index()); 11249e37000SMatthias Springer return success(); 11349e37000SMatthias Springer } 11449e37000SMatthias Springer }; 11549e37000SMatthias Springer 11649e37000SMatthias Springer /// Bufferization of tensor.extract_slice. Replace with memref.subview. 11749e37000SMatthias Springer struct ExtractSliceOpInterface 11849e37000SMatthias Springer : public BufferizableOpInterface::ExternalModel<ExtractSliceOpInterface, 11949e37000SMatthias Springer tensor::ExtractSliceOp> { 12049e37000SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 12149e37000SMatthias Springer const BufferizationState &state) const { 12249e37000SMatthias Springer return false; 12349e37000SMatthias Springer } 12449e37000SMatthias Springer 12549e37000SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 12649e37000SMatthias Springer const BufferizationState &state) const { 12749e37000SMatthias Springer return false; 12849e37000SMatthias Springer } 12949e37000SMatthias Springer 13049e37000SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 13149e37000SMatthias Springer const BufferizationState &state) const { 13249e37000SMatthias Springer return &opOperand == &op->getOpOperand(0) /*source*/ 13349e37000SMatthias Springer ? op->getResult(0) 13449e37000SMatthias Springer : OpResult(); 13549e37000SMatthias Springer } 13649e37000SMatthias Springer 13749e37000SMatthias Springer BufferRelation bufferRelation(Operation *op, OpResult opResult, 13849e37000SMatthias Springer const BufferizationState &state) const { 13949e37000SMatthias Springer return BufferRelation::None; 14049e37000SMatthias Springer } 14149e37000SMatthias Springer 14249e37000SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 14349e37000SMatthias Springer const BufferizationState &state) const { 14449e37000SMatthias Springer auto extractSliceOp = cast<tensor::ExtractSliceOp>(op); 14549e37000SMatthias Springer Location loc = extractSliceOp.getLoc(); 14649e37000SMatthias Springer Value srcMemref = 14749e37000SMatthias Springer *state.getBuffer(rewriter, extractSliceOp->getOpOperand(0) /*source*/, 14849e37000SMatthias Springer /*forceInPlace=*/true); 14949e37000SMatthias Springer auto srcMemrefType = srcMemref.getType().cast<MemRefType>(); 15049e37000SMatthias Springer auto dstTensorType = 15149e37000SMatthias Springer extractSliceOp.result().getType().cast<RankedTensorType>(); 15249e37000SMatthias Springer 15349e37000SMatthias Springer // If not inplaceable, alloc. 15449e37000SMatthias Springer bool inplace = state.isInPlace(extractSliceOp->getOpOperand(0)); 15549e37000SMatthias Springer Value alloc; 15649e37000SMatthias Springer if (!inplace) { 15749e37000SMatthias Springer FailureOr<Value> allocOrFailure = 15849e37000SMatthias Springer createAlloc(rewriter, loc, extractSliceOp.result(), 15949e37000SMatthias Springer state.getOptions().createDeallocs, state.getOptions()); 16049e37000SMatthias Springer if (failed(allocOrFailure)) 16149e37000SMatthias Springer return failure(); 16249e37000SMatthias Springer alloc = *allocOrFailure; 16349e37000SMatthias Springer } 16449e37000SMatthias Springer 16549e37000SMatthias Springer // Expand offsets, sizes and strides to the full rank to handle the 16649e37000SMatthias Springer // rank-reducing case. 16749e37000SMatthias Springer SmallVector<OpFoldResult> mixedOffsets = extractSliceOp.getMixedOffsets(); 16849e37000SMatthias Springer SmallVector<OpFoldResult> mixedSizes = extractSliceOp.getMixedSizes(); 16949e37000SMatthias Springer SmallVector<OpFoldResult> mixedStrides = extractSliceOp.getMixedStrides(); 17049e37000SMatthias Springer OffsetSizeAndStrideOpInterface::expandToRank( 17149e37000SMatthias Springer srcMemref, mixedOffsets, mixedSizes, mixedStrides, 17249e37000SMatthias Springer [&](Value target, int64_t dim) -> OpFoldResult { 17349e37000SMatthias Springer auto shapedType = target.getType().cast<ShapedType>(); 17449e37000SMatthias Springer if (shapedType.isDynamicDim(dim)) 17549e37000SMatthias Springer return rewriter.create<memref::DimOp>(loc, target, dim).result(); 17649e37000SMatthias Springer return rewriter.getIndexAttr(shapedType.getDimSize(dim)); 17749e37000SMatthias Springer }); 17849e37000SMatthias Springer // Bufferize to subview. 17949e37000SMatthias Springer auto subviewMemRefType = memref::SubViewOp::inferRankReducedResultType( 18049e37000SMatthias Springer dstTensorType.getRank(), srcMemrefType, 18149e37000SMatthias Springer mixedOffsets, mixedSizes, mixedStrides) 18249e37000SMatthias Springer .cast<MemRefType>(); 18349e37000SMatthias Springer Value subView = rewriter.create<memref::SubViewOp>( 18449e37000SMatthias Springer loc, subviewMemRefType, srcMemref, mixedOffsets, mixedSizes, 18549e37000SMatthias Springer mixedStrides); 18649e37000SMatthias Springer 18749e37000SMatthias Springer // If not inplaceable, copy. 18849e37000SMatthias Springer if (!inplace) { 18949e37000SMatthias Springer // Do not copy if the copied data is never read. 19049e37000SMatthias Springer if (state.isValueRead(extractSliceOp.result())) 19149e37000SMatthias Springer if (failed(createMemCpy(rewriter, extractSliceOp.getLoc(), subView, 19249e37000SMatthias Springer alloc, state.getOptions()))) 19349e37000SMatthias Springer return failure(); 19449e37000SMatthias Springer subView = alloc; 19549e37000SMatthias Springer } 19649e37000SMatthias Springer 19749e37000SMatthias Springer replaceOpWithBufferizedValues(rewriter, op, subView); 19849e37000SMatthias Springer return success(); 19949e37000SMatthias Springer } 20049e37000SMatthias Springer }; 20149e37000SMatthias Springer 20249e37000SMatthias Springer /// Bufferization of tensor.extract. Replace with memref.load. 20349e37000SMatthias Springer struct ExtractOpInterface 20449e37000SMatthias Springer : public BufferizableOpInterface::ExternalModel<ExtractOpInterface, 20549e37000SMatthias Springer tensor::ExtractOp> { 20649e37000SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 20749e37000SMatthias Springer const BufferizationState &state) const { 20849e37000SMatthias Springer return true; 20949e37000SMatthias Springer } 21049e37000SMatthias Springer 21149e37000SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 21249e37000SMatthias Springer const BufferizationState &state) const { 21349e37000SMatthias Springer return false; 21449e37000SMatthias Springer } 21549e37000SMatthias Springer 21649e37000SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 21749e37000SMatthias Springer const BufferizationState &state) const { 21849e37000SMatthias Springer return OpResult(); 21949e37000SMatthias Springer } 22049e37000SMatthias Springer 22149e37000SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 22249e37000SMatthias Springer const BufferizationState &state) const { 22349e37000SMatthias Springer auto extractOp = cast<tensor::ExtractOp>(op); 22449e37000SMatthias Springer Value srcMemref = 22549e37000SMatthias Springer *state.getBuffer(rewriter, extractOp->getOpOperand(0) /*tensor*/); 22649e37000SMatthias Springer replaceOpWithNewBufferizedOp<memref::LoadOp>(rewriter, op, srcMemref, 22749e37000SMatthias Springer extractOp.indices()); 22849e37000SMatthias Springer return success(); 22949e37000SMatthias Springer } 23049e37000SMatthias Springer }; 23149e37000SMatthias Springer 232*71bbb78bSMatthias Springer /// Bufferization of tensor.generate. 233*71bbb78bSMatthias Springer struct GenerateOpInterface 234*71bbb78bSMatthias Springer : public BufferizableOpInterface::ExternalModel<GenerateOpInterface, 235*71bbb78bSMatthias Springer tensor::GenerateOp> { 236*71bbb78bSMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 237*71bbb78bSMatthias Springer const BufferizationState &state) const { 238*71bbb78bSMatthias Springer auto generateOp = cast<tensor::GenerateOp>(op); 239*71bbb78bSMatthias Springer 240*71bbb78bSMatthias Springer // Allocate memory. 241*71bbb78bSMatthias Springer Location loc = op->getLoc(); 242*71bbb78bSMatthias Springer MemRefType memrefType = 243*71bbb78bSMatthias Springer getContiguousMemRefType(generateOp.getType().cast<RankedTensorType>()); 244*71bbb78bSMatthias Springer FailureOr<Value> maybeResult = 245*71bbb78bSMatthias Springer createAlloc(rewriter, loc, memrefType, generateOp.dynamicExtents(), 246*71bbb78bSMatthias Springer /*deallocMemref=*/state.getOptions().createDeallocs, 247*71bbb78bSMatthias Springer state.getOptions()); 248*71bbb78bSMatthias Springer if (failed(maybeResult)) 249*71bbb78bSMatthias Springer return failure(); 250*71bbb78bSMatthias Springer Value result = *maybeResult; 251*71bbb78bSMatthias Springer 252*71bbb78bSMatthias Springer // Collect loop bounds. 253*71bbb78bSMatthias Springer int64_t rank = memrefType.getRank(); 254*71bbb78bSMatthias Springer Value zero = rewriter.create<arith::ConstantIndexOp>(loc, 0); 255*71bbb78bSMatthias Springer Value one = rewriter.create<arith::ConstantIndexOp>(loc, 1); 256*71bbb78bSMatthias Springer SmallVector<Value, 4> lowerBounds(rank, zero); 257*71bbb78bSMatthias Springer SmallVector<Value, 4> steps(rank, one); 258*71bbb78bSMatthias Springer SmallVector<Value, 4> upperBounds; 259*71bbb78bSMatthias Springer int nextDynamicIndex = 0; 260*71bbb78bSMatthias Springer for (int i = 0; i < rank; i++) { 261*71bbb78bSMatthias Springer Value upperBound = memrefType.isDynamicDim(i) 262*71bbb78bSMatthias Springer ? generateOp.dynamicExtents()[nextDynamicIndex++] 263*71bbb78bSMatthias Springer : rewriter.create<arith::ConstantIndexOp>( 264*71bbb78bSMatthias Springer loc, memrefType.getDimSize(i)); 265*71bbb78bSMatthias Springer upperBounds.push_back(upperBound); 266*71bbb78bSMatthias Springer } 267*71bbb78bSMatthias Springer 268*71bbb78bSMatthias Springer // Generate tensor elements with a parallel loop that stores into 269*71bbb78bSMatthias Springer // each element of the resulting memref. We use mergeBlockBefore to "move" 270*71bbb78bSMatthias Springer // this op's body into the scf.parallel's body. 271*71bbb78bSMatthias Springer auto parallel = 272*71bbb78bSMatthias Springer rewriter.create<scf::ParallelOp>(loc, lowerBounds, upperBounds, steps); 273*71bbb78bSMatthias Springer Block *parallelBody = parallel.getBody(); 274*71bbb78bSMatthias Springer rewriter.mergeBlockBefore(generateOp.getBody(), 275*71bbb78bSMatthias Springer parallelBody->getTerminator(), 276*71bbb78bSMatthias Springer parallelBody->getArguments()); 277*71bbb78bSMatthias Springer // Replace the inlined yield op with a store op. The scf.parallel's builder 278*71bbb78bSMatthias Springer // already populated an scf.yield at the end, so we don't need to worry 279*71bbb78bSMatthias Springer // about creating that. 280*71bbb78bSMatthias Springer Operation *elementYield = parallelBody->getTerminator()->getPrevNode(); 281*71bbb78bSMatthias Springer rewriter.setInsertionPointAfter(elementYield); 282*71bbb78bSMatthias Springer rewriter.replaceOpWithNewOp<memref::StoreOp>( 283*71bbb78bSMatthias Springer elementYield, elementYield->getOperands()[0], result, 284*71bbb78bSMatthias Springer parallelBody->getArguments()); 285*71bbb78bSMatthias Springer 286*71bbb78bSMatthias Springer replaceOpWithBufferizedValues(rewriter, op, result); 287*71bbb78bSMatthias Springer return success(); 288*71bbb78bSMatthias Springer } 289*71bbb78bSMatthias Springer }; 290*71bbb78bSMatthias Springer 29149e37000SMatthias Springer /// Bufferization of tensor.insert. Replace with memref.store. 29249e37000SMatthias Springer struct InsertOpInterface 29349e37000SMatthias Springer : public BufferizableOpInterface::ExternalModel<InsertOpInterface, 29449e37000SMatthias Springer tensor::InsertOp> { 29549e37000SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 29649e37000SMatthias Springer const BufferizationState &state) const { 29749e37000SMatthias Springer return true; 29849e37000SMatthias Springer } 29949e37000SMatthias Springer 30049e37000SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 30149e37000SMatthias Springer const BufferizationState &state) const { 30249e37000SMatthias Springer return true; 30349e37000SMatthias Springer } 30449e37000SMatthias Springer 30549e37000SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 30649e37000SMatthias Springer const BufferizationState &state) const { 30749e37000SMatthias Springer assert(&opOperand == &op->getOpOperand(1) /*dest*/ && 30849e37000SMatthias Springer "expected dest OpOperand"); 30949e37000SMatthias Springer return op->getOpResult(0); 31049e37000SMatthias Springer } 31149e37000SMatthias Springer 31249e37000SMatthias Springer SmallVector<OpOperand *> 31349e37000SMatthias Springer getAliasingOpOperand(Operation *op, OpResult opResult, 31449e37000SMatthias Springer const BufferizationState &state) const { 31549e37000SMatthias Springer return {&op->getOpOperand(1) /*dest*/}; 31649e37000SMatthias Springer } 31749e37000SMatthias Springer 31849e37000SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 31949e37000SMatthias Springer const BufferizationState &state) const { 32049e37000SMatthias Springer auto insertOp = cast<tensor::InsertOp>(op); 32149e37000SMatthias Springer FailureOr<Value> destMemref = 32249e37000SMatthias Springer state.getBuffer(rewriter, insertOp->getOpOperand(1) /*dest*/); 32349e37000SMatthias Springer if (failed(destMemref)) 32449e37000SMatthias Springer return failure(); 32549e37000SMatthias Springer rewriter.create<memref::StoreOp>(insertOp.getLoc(), insertOp.scalar(), 32649e37000SMatthias Springer *destMemref, insertOp.indices()); 32749e37000SMatthias Springer replaceOpWithBufferizedValues(rewriter, op, *destMemref); 32849e37000SMatthias Springer return success(); 32949e37000SMatthias Springer } 33049e37000SMatthias Springer 33149e37000SMatthias Springer BufferRelation bufferRelation(Operation *op, OpResult opResult, 33249e37000SMatthias Springer const BufferizationState &state) const { 33349e37000SMatthias Springer return BufferRelation::Equivalent; 33449e37000SMatthias Springer } 33549e37000SMatthias Springer }; 33649e37000SMatthias Springer 33749e37000SMatthias Springer /// Return true if the (ExtractSliceOp, InsertSliceOp) pair match (i.e. 33849e37000SMatthias Springer /// equivalent operand / result and same offset/sizes/strides specification). 33949e37000SMatthias Springer /// 34049e37000SMatthias Springer /// This is one particular type of relationship between ops on tensors that 34149e37000SMatthias Springer /// reduce to an equivalence on buffers. This should be generalized and 34249e37000SMatthias Springer /// exposed as interfaces on the proper types. 34349e37000SMatthias Springer static bool areEquivalentExtractSliceOps(const BufferizationState &state, 34449e37000SMatthias Springer ExtractSliceOp st, InsertSliceOp sti) { 34549e37000SMatthias Springer if (!st || !sti) 34649e37000SMatthias Springer return false; 34749e37000SMatthias Springer if (sti != sti && 34849e37000SMatthias Springer !state.areEquivalentBufferizedValues(st.source(), sti.dest())) 34949e37000SMatthias Springer return false; 35049e37000SMatthias Springer if (!sameOffsetsSizesAndStrides(st, sti, isEqualConstantIntOrValue)) 35149e37000SMatthias Springer return false; 35249e37000SMatthias Springer return true; 35349e37000SMatthias Springer } 35449e37000SMatthias Springer 35549e37000SMatthias Springer /// Return true if `value` is originating from an ExtractSliceOp that matches 35649e37000SMatthias Springer /// the given InsertSliceOp. 35749e37000SMatthias Springer static bool hasMatchingExtractSliceOp(const BufferizationState &state, 35849e37000SMatthias Springer Value value, InsertSliceOp insertOp) { 35949e37000SMatthias Springer auto condition = [&](Value val) { 36049e37000SMatthias Springer if (auto extractOp = val.getDefiningOp<ExtractSliceOp>()) 36149e37000SMatthias Springer if (areEquivalentExtractSliceOps(state, extractOp, insertOp)) 36249e37000SMatthias Springer return true; 36349e37000SMatthias Springer return false; 36449e37000SMatthias Springer }; 36549e37000SMatthias Springer 36649e37000SMatthias Springer return llvm::all_of(state.findValueInReverseUseDefChain(value, condition), 36749e37000SMatthias Springer condition); 36849e37000SMatthias Springer } 36949e37000SMatthias Springer 37049e37000SMatthias Springer /// Bufferization of tensor.insert_slice. Replace with a memory copy. Under 37149e37000SMatthias Springer /// certain circumstances, this op can also be a no-op. 37249e37000SMatthias Springer struct InsertSliceOpInterface 37349e37000SMatthias Springer : public BufferizableOpInterface::ExternalModel<InsertSliceOpInterface, 37449e37000SMatthias Springer tensor::InsertSliceOp> { 37549e37000SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 37649e37000SMatthias Springer const BufferizationState &state) const { 37749e37000SMatthias Springer return true; 37849e37000SMatthias Springer } 37949e37000SMatthias Springer 38049e37000SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 38149e37000SMatthias Springer const BufferizationState &state) const { 38249e37000SMatthias Springer return &opOperand == &op->getOpOperand(1) /*dest*/; 38349e37000SMatthias Springer } 38449e37000SMatthias Springer 38549e37000SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 38649e37000SMatthias Springer const BufferizationState &state) const { 38749e37000SMatthias Springer return &opOperand == &op->getOpOperand(1) /*dest*/ 38849e37000SMatthias Springer ? op->getResult(0) 38949e37000SMatthias Springer : OpResult(); 39049e37000SMatthias Springer } 39149e37000SMatthias Springer 39249e37000SMatthias Springer BufferRelation bufferRelation(Operation *op, OpResult opResult, 39349e37000SMatthias Springer const BufferizationState &state) const { 39449e37000SMatthias Springer return BufferRelation::Equivalent; 39549e37000SMatthias Springer } 39649e37000SMatthias Springer 39749e37000SMatthias Springer bool isNotConflicting(Operation *op, OpOperand *uRead, 39849e37000SMatthias Springer OpOperand *uConflictingWrite, 39949e37000SMatthias Springer const BufferizationState &state) const { 40049e37000SMatthias Springer Operation *readingOp = uRead->getOwner(); 40149e37000SMatthias Springer Operation *conflictingWritingOp = uConflictingWrite->getOwner(); 40249e37000SMatthias Springer 40349e37000SMatthias Springer // Special rules for matching ExtractSliceOp/InsertSliceOp pairs. If 40449e37000SMatthias Springer // uRead is an InsertSliceOp... 40549e37000SMatthias Springer if (auto insertSliceOp = dyn_cast<InsertSliceOp>(readingOp)) { 40649e37000SMatthias Springer // As an example, consider the following IR. 40749e37000SMatthias Springer // 40849e37000SMatthias Springer // %0 = tensor.extract_slice %t[%a, %b][%c, %d][1, 1] {inplace = [true] } 40949e37000SMatthias Springer // %1 = linalg.fill %cst, %0 {inplace= [true] } 41049e37000SMatthias Springer // %2 = tensor.insert_slice %1 into %t[%a, %b][%c, %d][1, 1] 41149e37000SMatthias Springer // {inplace= [true] } 41249e37000SMatthias Springer 41349e37000SMatthias Springer // TODO: Use insertSliceOp.getDestOpOperand etc. when available. 41449e37000SMatthias Springer if (uRead == &insertSliceOp->getOpOperand(1) /*dest*/ && 41549e37000SMatthias Springer hasMatchingExtractSliceOp(state, uConflictingWrite->get(), 41649e37000SMatthias Springer insertSliceOp)) 41749e37000SMatthias Springer // Case 1: The main insight is that InsertSliceOp reads only part of 41849e37000SMatthias Springer // the destination tensor. The overwritten area is not read. If 41949e37000SMatthias Springer // uConflictingWrite writes into exactly the memory location that is 42049e37000SMatthias Springer // being read by uRead, this is not a conflict. 42149e37000SMatthias Springer // 42249e37000SMatthias Springer // In the above example: 42349e37000SMatthias Springer // uRead = OpOperand 1 (%t) of tensor.insert_slice 42449e37000SMatthias Springer // uConflictingWrite = OpOperand 1 (%0) of linalg.fill 42549e37000SMatthias Springer // 42649e37000SMatthias Springer // The read of %t does not conflict with the write of the FillOp 42749e37000SMatthias Springer // (same aliases!) because the area that the FillOp operates on is 42849e37000SMatthias Springer // exactly the one that is *not* read via %t. 42949e37000SMatthias Springer return true; 43049e37000SMatthias Springer 43149e37000SMatthias Springer if (uRead == &insertSliceOp->getOpOperand(0) /*source*/ && 43249e37000SMatthias Springer uConflictingWrite == &insertSliceOp->getOpOperand(1) /*dest*/ && 43349e37000SMatthias Springer hasMatchingExtractSliceOp(state, uRead->get(), insertSliceOp)) 43449e37000SMatthias Springer // Case 2: The read of the source tensor and the write to the dest 43549e37000SMatthias Springer // tensor via an InsertSliceOp is not a conflict if the read is 43649e37000SMatthias Springer // reading exactly that part of an equivalent tensor that the 43749e37000SMatthias Springer // InsertSliceOp is writing. 43849e37000SMatthias Springer // 43949e37000SMatthias Springer // In the above example: 44049e37000SMatthias Springer // uRead = OpOperand 0 (%1) of tensor.insert_slice 44149e37000SMatthias Springer // uConflictingWrite = OpOperand 1 (%t) of tensor.insert_slice 44249e37000SMatthias Springer return true; 44349e37000SMatthias Springer } 44449e37000SMatthias Springer 44549e37000SMatthias Springer // If uConflictingWrite is an InsertSliceOp... 44649e37000SMatthias Springer if (auto insertSliceOp = dyn_cast<InsertSliceOp>(conflictingWritingOp)) 44749e37000SMatthias Springer // As an example, consider the following IR. 44849e37000SMatthias Springer // 44949e37000SMatthias Springer // %0 = tensor.extract_slice %t[%a, %b][%c, %d][1, 1] {inplace = [true] } 45049e37000SMatthias Springer // %1 = linalg.fill %cst, %0 {inplace= [true] } 45149e37000SMatthias Springer // %2 = tensor.insert_slice %1 into %t[%a, %b][%c, %d][1, 1] 45249e37000SMatthias Springer // {inplace= [true] } 45349e37000SMatthias Springer // %3 = vector.transfer_read %1, %cst 45449e37000SMatthias Springer // 45549e37000SMatthias Springer // In the above example: 45649e37000SMatthias Springer // uRead = OpOperand 0 (%1) of vector.transfer_read 45749e37000SMatthias Springer // uConflictingWrite = OpOperand 1 (%t) of tensor.insert_slice 45849e37000SMatthias Springer // lastWrite = %1 45949e37000SMatthias Springer // 46049e37000SMatthias Springer // This is not a conflict because the InsertSliceOp overwrites the 46149e37000SMatthias Springer // memory segment of %1 with the exact same data. (Effectively, there 46249e37000SMatthias Springer // is no memory write here.) 46349e37000SMatthias Springer if (uConflictingWrite == &insertSliceOp->getOpOperand(1) /*dest*/ && 46449e37000SMatthias Springer state.areEquivalentBufferizedValues(uRead->get(), 46549e37000SMatthias Springer insertSliceOp.source()) && 46649e37000SMatthias Springer hasMatchingExtractSliceOp(state, insertSliceOp.source(), 46749e37000SMatthias Springer insertSliceOp)) 46849e37000SMatthias Springer return true; 46949e37000SMatthias Springer 47049e37000SMatthias Springer return false; 47149e37000SMatthias Springer } 47249e37000SMatthias Springer 47349e37000SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 47449e37000SMatthias Springer const BufferizationState &state) const { 47549e37000SMatthias Springer // insert_slice ops arise from tiling and bufferizing them out-of-place is 47649e37000SMatthias Springer // generally a deal breaker. When used with loops, this ends up cloning the 47749e37000SMatthias Springer // whole tensor on every single iteration and is a symptom of a 47849e37000SMatthias Springer // catastrophically bad scheduling decision. 47949e37000SMatthias Springer // TODO: be very loud about it or even consider failing the pass. 48049e37000SMatthias Springer auto insertSliceOp = cast<tensor::InsertSliceOp>(op); 48149e37000SMatthias Springer Location loc = insertSliceOp.getLoc(); 48249e37000SMatthias Springer 48349e37000SMatthias Springer // When bufferizing out-of-place, `getResultBuffer` allocates. 48449e37000SMatthias Springer FailureOr<Value> dstMemref = 48549e37000SMatthias Springer state.getBuffer(rewriter, insertSliceOp->getOpOperand(1) /*dest*/); 48649e37000SMatthias Springer if (failed(dstMemref)) 48749e37000SMatthias Springer return failure(); 48849e37000SMatthias Springer 48949e37000SMatthias Springer // Expand offsets, sizes and strides to the full rank to handle the 49049e37000SMatthias Springer // rank-reducing case. 49149e37000SMatthias Springer SmallVector<OpFoldResult> mixedOffsets = insertSliceOp.getMixedOffsets(); 49249e37000SMatthias Springer SmallVector<OpFoldResult> mixedSizes = insertSliceOp.getMixedSizes(); 49349e37000SMatthias Springer SmallVector<OpFoldResult> mixedStrides = insertSliceOp.getMixedStrides(); 49449e37000SMatthias Springer OffsetSizeAndStrideOpInterface::expandToRank( 49549e37000SMatthias Springer *dstMemref, mixedOffsets, mixedSizes, mixedStrides, 49649e37000SMatthias Springer [&](Value target, int64_t dim) -> OpFoldResult { 49749e37000SMatthias Springer auto shapedType = target.getType().cast<ShapedType>(); 49849e37000SMatthias Springer if (shapedType.isDynamicDim(dim)) 49949e37000SMatthias Springer return rewriter.create<memref::DimOp>(loc, target, dim).result(); 50049e37000SMatthias Springer return rewriter.getIndexAttr(shapedType.getDimSize(dim)); 50149e37000SMatthias Springer }); 50249e37000SMatthias Springer // Take a subview of the dst. 50349e37000SMatthias Springer auto dstMemrefType = dstMemref->getType().cast<MemRefType>(); 50449e37000SMatthias Springer auto subviewMemRefType = 50549e37000SMatthias Springer memref::SubViewOp::inferRankReducedResultType( 50649e37000SMatthias Springer insertSliceOp.getSourceType().getRank(), dstMemrefType, 50749e37000SMatthias Springer mixedOffsets, mixedSizes, mixedStrides) 50849e37000SMatthias Springer .cast<MemRefType>(); 50949e37000SMatthias Springer Value subView = rewriter.create<memref::SubViewOp>( 51049e37000SMatthias Springer loc, subviewMemRefType, *dstMemref, mixedOffsets, mixedSizes, 51149e37000SMatthias Springer mixedStrides); 51249e37000SMatthias Springer 51349e37000SMatthias Springer // Copy tensor. If this tensor.insert_slice has a matching 51449e37000SMatthias Springer // tensor.extract_slice, the copy operation will eventually fold away. 51549e37000SMatthias Springer Value srcMemref = 51649e37000SMatthias Springer *state.getBuffer(rewriter, insertSliceOp->getOpOperand(0) /*source*/); 51749e37000SMatthias Springer if (failed(createMemCpy(rewriter, loc, srcMemref, subView, 51849e37000SMatthias Springer state.getOptions()))) 51949e37000SMatthias Springer return failure(); 52049e37000SMatthias Springer 52149e37000SMatthias Springer replaceOpWithBufferizedValues(rewriter, op, *dstMemref); 52249e37000SMatthias Springer return success(); 52349e37000SMatthias Springer } 52449e37000SMatthias Springer }; 52549e37000SMatthias Springer 526fc08d1c2SMatthias Springer /// Bufferization of tensor.rank. Replace with memref.rank. 527fc08d1c2SMatthias Springer struct RankOpInterface 528fc08d1c2SMatthias Springer : public BufferizableOpInterface::ExternalModel<RankOpInterface, 529fc08d1c2SMatthias Springer tensor::RankOp> { 530fc08d1c2SMatthias Springer bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand, 531fc08d1c2SMatthias Springer const BufferizationState &state) const { 532fc08d1c2SMatthias Springer return true; 533fc08d1c2SMatthias Springer } 534fc08d1c2SMatthias Springer 535fc08d1c2SMatthias Springer bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand, 536fc08d1c2SMatthias Springer const BufferizationState &state) const { 537fc08d1c2SMatthias Springer return false; 538fc08d1c2SMatthias Springer } 539fc08d1c2SMatthias Springer 540fc08d1c2SMatthias Springer OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand, 541fc08d1c2SMatthias Springer const BufferizationState &state) const { 542fc08d1c2SMatthias Springer return OpResult(); 543fc08d1c2SMatthias Springer } 544fc08d1c2SMatthias Springer 545fc08d1c2SMatthias Springer LogicalResult bufferize(Operation *op, RewriterBase &rewriter, 546fc08d1c2SMatthias Springer const BufferizationState &state) const { 547fc08d1c2SMatthias Springer auto rankOp = cast<tensor::RankOp>(op); 548fc08d1c2SMatthias Springer Value v = *state.getBuffer(rewriter, rankOp->getOpOperand(0) /*source*/); 549fc08d1c2SMatthias Springer replaceOpWithNewBufferizedOp<memref::RankOp>(rewriter, op, rankOp.getType(), 550fc08d1c2SMatthias Springer v); 551fc08d1c2SMatthias Springer return success(); 552fc08d1c2SMatthias Springer } 553fc08d1c2SMatthias Springer }; 554fc08d1c2SMatthias Springer 55549e37000SMatthias Springer } // namespace 55649e37000SMatthias Springer } // namespace tensor 55749e37000SMatthias Springer } // namespace mlir 55849e37000SMatthias Springer 55949e37000SMatthias Springer void mlir::tensor::registerBufferizableOpInterfaceExternalModels( 56049e37000SMatthias Springer DialectRegistry ®istry) { 56149e37000SMatthias Springer registry.addOpInterface<CastOp, CastOpInterface>(); 56249e37000SMatthias Springer registry.addOpInterface<DimOp, DimOpInterface>(); 56349e37000SMatthias Springer registry.addOpInterface<ExtractSliceOp, ExtractSliceOpInterface>(); 56449e37000SMatthias Springer registry.addOpInterface<ExtractOp, ExtractOpInterface>(); 565*71bbb78bSMatthias Springer registry.addOpInterface<GenerateOp, GenerateOpInterface>(); 56649e37000SMatthias Springer registry.addOpInterface<InsertOp, InsertOpInterface>(); 56749e37000SMatthias Springer registry.addOpInterface<InsertSliceOp, InsertSliceOpInterface>(); 568fc08d1c2SMatthias Springer registry.addOpInterface<RankOp, RankOpInterface>(); 56949e37000SMatthias Springer } 570