149e37000SMatthias Springer //===- BufferizableOpInterfaceImpl.cpp - Impl. of BufferizableOpInterface -===//
249e37000SMatthias Springer //
349e37000SMatthias Springer // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
449e37000SMatthias Springer // See https://llvm.org/LICENSE.txt for license information.
549e37000SMatthias Springer // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
649e37000SMatthias Springer //
749e37000SMatthias Springer //===----------------------------------------------------------------------===//
849e37000SMatthias Springer 
949e37000SMatthias Springer #include "mlir/Dialect/Tensor/Transforms/BufferizableOpInterfaceImpl.h"
1049e37000SMatthias Springer #include "mlir/Dialect/Bufferization/IR/BufferizableOpInterface.h"
1149e37000SMatthias Springer #include "mlir/Dialect/MemRef/IR/MemRef.h"
12*71bbb78bSMatthias Springer #include "mlir/Dialect/SCF/SCF.h"
1349e37000SMatthias Springer #include "mlir/Dialect/Tensor/IR/Tensor.h"
1449e37000SMatthias Springer #include "mlir/IR/Dialect.h"
1549e37000SMatthias Springer #include "mlir/IR/Operation.h"
1649e37000SMatthias Springer 
1749e37000SMatthias Springer using namespace mlir;
1849e37000SMatthias Springer using namespace mlir::bufferization;
1949e37000SMatthias Springer using namespace mlir::tensor;
2049e37000SMatthias Springer 
2149e37000SMatthias Springer namespace mlir {
2249e37000SMatthias Springer namespace tensor {
2349e37000SMatthias Springer namespace {
2449e37000SMatthias Springer 
2549e37000SMatthias Springer struct CastOpInterface
2649e37000SMatthias Springer     : public BufferizableOpInterface::ExternalModel<CastOpInterface,
2749e37000SMatthias Springer                                                     tensor::CastOp> {
2849e37000SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
2949e37000SMatthias Springer                               const BufferizationState &state) const {
3049e37000SMatthias Springer     return false;
3149e37000SMatthias Springer   }
3249e37000SMatthias Springer 
3349e37000SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
3449e37000SMatthias Springer                                const BufferizationState &state) const {
3549e37000SMatthias Springer     return false;
3649e37000SMatthias Springer   }
3749e37000SMatthias Springer 
3849e37000SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
3949e37000SMatthias Springer                                const BufferizationState &state) const {
4049e37000SMatthias Springer     return op->getResult(0);
4149e37000SMatthias Springer   }
4249e37000SMatthias Springer 
4349e37000SMatthias Springer   BufferRelation bufferRelation(Operation *op, OpResult opResult,
4449e37000SMatthias Springer                                 const BufferizationState &state) const {
4549e37000SMatthias Springer     return BufferRelation::Equivalent;
4649e37000SMatthias Springer   }
4749e37000SMatthias Springer 
4849e37000SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
4949e37000SMatthias Springer                           const BufferizationState &state) const {
5049e37000SMatthias Springer     auto castOp = cast<tensor::CastOp>(op);
5149e37000SMatthias Springer 
5249e37000SMatthias Springer     // The result buffer still has the old (pre-cast) type.
5349e37000SMatthias Springer     FailureOr<Value> resultBuffer =
5449e37000SMatthias Springer         state.getBuffer(rewriter, castOp->getOpOperand(0) /*source*/);
5549e37000SMatthias Springer     if (failed(resultBuffer))
5649e37000SMatthias Springer       return failure();
5749e37000SMatthias Springer     auto sourceMemRefType = resultBuffer->getType().cast<BaseMemRefType>();
5849e37000SMatthias Springer     Attribute memorySpace = sourceMemRefType.getMemorySpace();
5949e37000SMatthias Springer     TensorType resultTensorType =
6049e37000SMatthias Springer         castOp.getResult().getType().cast<TensorType>();
6149e37000SMatthias Springer     MemRefLayoutAttrInterface layout;
6249e37000SMatthias Springer 
6349e37000SMatthias Springer     if (auto rankedMemRefType = sourceMemRefType.dyn_cast<MemRefType>())
6449e37000SMatthias Springer       if (resultTensorType.isa<RankedTensorType>())
6549e37000SMatthias Springer         layout = rankedMemRefType.getLayout();
6649e37000SMatthias Springer 
6749e37000SMatthias Springer     // Compute the new memref type.
6849e37000SMatthias Springer     Type resultMemRefType;
6949e37000SMatthias Springer     if (resultTensorType.isa<RankedTensorType>()) {
7049e37000SMatthias Springer       resultMemRefType =
7149e37000SMatthias Springer           getContiguousMemRefType(resultTensorType, layout, memorySpace);
7249e37000SMatthias Springer     } else {
7349e37000SMatthias Springer       resultMemRefType =
7449e37000SMatthias Springer           getUnrankedMemRefType(resultTensorType.getElementType(), memorySpace);
7549e37000SMatthias Springer     }
7649e37000SMatthias Springer 
7749e37000SMatthias Springer     // Replace the op with a memref.cast.
7849e37000SMatthias Springer     assert(memref::CastOp::areCastCompatible(resultBuffer->getType(),
7949e37000SMatthias Springer                                              resultMemRefType) &&
8049e37000SMatthias Springer            "CallOp::bufferize: cast incompatible");
8149e37000SMatthias Springer     replaceOpWithNewBufferizedOp<memref::CastOp>(rewriter, op, resultMemRefType,
8249e37000SMatthias Springer                                                  *resultBuffer);
8349e37000SMatthias Springer 
8449e37000SMatthias Springer     return success();
8549e37000SMatthias Springer   }
8649e37000SMatthias Springer };
8749e37000SMatthias Springer 
8849e37000SMatthias Springer /// Bufferization of tensor.dim. Replace with memref.dim.
8949e37000SMatthias Springer struct DimOpInterface
9049e37000SMatthias Springer     : public BufferizableOpInterface::ExternalModel<DimOpInterface,
9149e37000SMatthias Springer                                                     tensor::DimOp> {
9249e37000SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
9349e37000SMatthias Springer                               const BufferizationState &state) const {
9449e37000SMatthias Springer     return true;
9549e37000SMatthias Springer   }
9649e37000SMatthias Springer 
9749e37000SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
9849e37000SMatthias Springer                                const BufferizationState &state) const {
9949e37000SMatthias Springer     return false;
10049e37000SMatthias Springer   }
10149e37000SMatthias Springer 
10249e37000SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
10349e37000SMatthias Springer                                const BufferizationState &state) const {
10449e37000SMatthias Springer     return OpResult();
10549e37000SMatthias Springer   }
10649e37000SMatthias Springer 
10749e37000SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
10849e37000SMatthias Springer                           const BufferizationState &state) const {
10949e37000SMatthias Springer     auto dimOp = cast<tensor::DimOp>(op);
11049e37000SMatthias Springer     Value v = *state.getBuffer(rewriter, dimOp->getOpOperand(0) /*source*/);
11149e37000SMatthias Springer     replaceOpWithNewBufferizedOp<memref::DimOp>(rewriter, op, v, dimOp.index());
11249e37000SMatthias Springer     return success();
11349e37000SMatthias Springer   }
11449e37000SMatthias Springer };
11549e37000SMatthias Springer 
11649e37000SMatthias Springer /// Bufferization of tensor.extract_slice. Replace with memref.subview.
11749e37000SMatthias Springer struct ExtractSliceOpInterface
11849e37000SMatthias Springer     : public BufferizableOpInterface::ExternalModel<ExtractSliceOpInterface,
11949e37000SMatthias Springer                                                     tensor::ExtractSliceOp> {
12049e37000SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
12149e37000SMatthias Springer                               const BufferizationState &state) const {
12249e37000SMatthias Springer     return false;
12349e37000SMatthias Springer   }
12449e37000SMatthias Springer 
12549e37000SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
12649e37000SMatthias Springer                                const BufferizationState &state) const {
12749e37000SMatthias Springer     return false;
12849e37000SMatthias Springer   }
12949e37000SMatthias Springer 
13049e37000SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
13149e37000SMatthias Springer                                const BufferizationState &state) const {
13249e37000SMatthias Springer     return &opOperand == &op->getOpOperand(0) /*source*/
13349e37000SMatthias Springer                ? op->getResult(0)
13449e37000SMatthias Springer                : OpResult();
13549e37000SMatthias Springer   }
13649e37000SMatthias Springer 
13749e37000SMatthias Springer   BufferRelation bufferRelation(Operation *op, OpResult opResult,
13849e37000SMatthias Springer                                 const BufferizationState &state) const {
13949e37000SMatthias Springer     return BufferRelation::None;
14049e37000SMatthias Springer   }
14149e37000SMatthias Springer 
14249e37000SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
14349e37000SMatthias Springer                           const BufferizationState &state) const {
14449e37000SMatthias Springer     auto extractSliceOp = cast<tensor::ExtractSliceOp>(op);
14549e37000SMatthias Springer     Location loc = extractSliceOp.getLoc();
14649e37000SMatthias Springer     Value srcMemref =
14749e37000SMatthias Springer         *state.getBuffer(rewriter, extractSliceOp->getOpOperand(0) /*source*/,
14849e37000SMatthias Springer                          /*forceInPlace=*/true);
14949e37000SMatthias Springer     auto srcMemrefType = srcMemref.getType().cast<MemRefType>();
15049e37000SMatthias Springer     auto dstTensorType =
15149e37000SMatthias Springer         extractSliceOp.result().getType().cast<RankedTensorType>();
15249e37000SMatthias Springer 
15349e37000SMatthias Springer     // If not inplaceable, alloc.
15449e37000SMatthias Springer     bool inplace = state.isInPlace(extractSliceOp->getOpOperand(0));
15549e37000SMatthias Springer     Value alloc;
15649e37000SMatthias Springer     if (!inplace) {
15749e37000SMatthias Springer       FailureOr<Value> allocOrFailure =
15849e37000SMatthias Springer           createAlloc(rewriter, loc, extractSliceOp.result(),
15949e37000SMatthias Springer                       state.getOptions().createDeallocs, state.getOptions());
16049e37000SMatthias Springer       if (failed(allocOrFailure))
16149e37000SMatthias Springer         return failure();
16249e37000SMatthias Springer       alloc = *allocOrFailure;
16349e37000SMatthias Springer     }
16449e37000SMatthias Springer 
16549e37000SMatthias Springer     // Expand offsets, sizes and strides to the full rank to handle the
16649e37000SMatthias Springer     // rank-reducing case.
16749e37000SMatthias Springer     SmallVector<OpFoldResult> mixedOffsets = extractSliceOp.getMixedOffsets();
16849e37000SMatthias Springer     SmallVector<OpFoldResult> mixedSizes = extractSliceOp.getMixedSizes();
16949e37000SMatthias Springer     SmallVector<OpFoldResult> mixedStrides = extractSliceOp.getMixedStrides();
17049e37000SMatthias Springer     OffsetSizeAndStrideOpInterface::expandToRank(
17149e37000SMatthias Springer         srcMemref, mixedOffsets, mixedSizes, mixedStrides,
17249e37000SMatthias Springer         [&](Value target, int64_t dim) -> OpFoldResult {
17349e37000SMatthias Springer           auto shapedType = target.getType().cast<ShapedType>();
17449e37000SMatthias Springer           if (shapedType.isDynamicDim(dim))
17549e37000SMatthias Springer             return rewriter.create<memref::DimOp>(loc, target, dim).result();
17649e37000SMatthias Springer           return rewriter.getIndexAttr(shapedType.getDimSize(dim));
17749e37000SMatthias Springer         });
17849e37000SMatthias Springer     // Bufferize to subview.
17949e37000SMatthias Springer     auto subviewMemRefType = memref::SubViewOp::inferRankReducedResultType(
18049e37000SMatthias Springer                                  dstTensorType.getRank(), srcMemrefType,
18149e37000SMatthias Springer                                  mixedOffsets, mixedSizes, mixedStrides)
18249e37000SMatthias Springer                                  .cast<MemRefType>();
18349e37000SMatthias Springer     Value subView = rewriter.create<memref::SubViewOp>(
18449e37000SMatthias Springer         loc, subviewMemRefType, srcMemref, mixedOffsets, mixedSizes,
18549e37000SMatthias Springer         mixedStrides);
18649e37000SMatthias Springer 
18749e37000SMatthias Springer     // If not inplaceable, copy.
18849e37000SMatthias Springer     if (!inplace) {
18949e37000SMatthias Springer       // Do not copy if the copied data is never read.
19049e37000SMatthias Springer       if (state.isValueRead(extractSliceOp.result()))
19149e37000SMatthias Springer         if (failed(createMemCpy(rewriter, extractSliceOp.getLoc(), subView,
19249e37000SMatthias Springer                                 alloc, state.getOptions())))
19349e37000SMatthias Springer           return failure();
19449e37000SMatthias Springer       subView = alloc;
19549e37000SMatthias Springer     }
19649e37000SMatthias Springer 
19749e37000SMatthias Springer     replaceOpWithBufferizedValues(rewriter, op, subView);
19849e37000SMatthias Springer     return success();
19949e37000SMatthias Springer   }
20049e37000SMatthias Springer };
20149e37000SMatthias Springer 
20249e37000SMatthias Springer /// Bufferization of tensor.extract. Replace with memref.load.
20349e37000SMatthias Springer struct ExtractOpInterface
20449e37000SMatthias Springer     : public BufferizableOpInterface::ExternalModel<ExtractOpInterface,
20549e37000SMatthias Springer                                                     tensor::ExtractOp> {
20649e37000SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
20749e37000SMatthias Springer                               const BufferizationState &state) const {
20849e37000SMatthias Springer     return true;
20949e37000SMatthias Springer   }
21049e37000SMatthias Springer 
21149e37000SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
21249e37000SMatthias Springer                                const BufferizationState &state) const {
21349e37000SMatthias Springer     return false;
21449e37000SMatthias Springer   }
21549e37000SMatthias Springer 
21649e37000SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
21749e37000SMatthias Springer                                const BufferizationState &state) const {
21849e37000SMatthias Springer     return OpResult();
21949e37000SMatthias Springer   }
22049e37000SMatthias Springer 
22149e37000SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
22249e37000SMatthias Springer                           const BufferizationState &state) const {
22349e37000SMatthias Springer     auto extractOp = cast<tensor::ExtractOp>(op);
22449e37000SMatthias Springer     Value srcMemref =
22549e37000SMatthias Springer         *state.getBuffer(rewriter, extractOp->getOpOperand(0) /*tensor*/);
22649e37000SMatthias Springer     replaceOpWithNewBufferizedOp<memref::LoadOp>(rewriter, op, srcMemref,
22749e37000SMatthias Springer                                                  extractOp.indices());
22849e37000SMatthias Springer     return success();
22949e37000SMatthias Springer   }
23049e37000SMatthias Springer };
23149e37000SMatthias Springer 
232*71bbb78bSMatthias Springer /// Bufferization of tensor.generate.
233*71bbb78bSMatthias Springer struct GenerateOpInterface
234*71bbb78bSMatthias Springer     : public BufferizableOpInterface::ExternalModel<GenerateOpInterface,
235*71bbb78bSMatthias Springer                                                     tensor::GenerateOp> {
236*71bbb78bSMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
237*71bbb78bSMatthias Springer                           const BufferizationState &state) const {
238*71bbb78bSMatthias Springer     auto generateOp = cast<tensor::GenerateOp>(op);
239*71bbb78bSMatthias Springer 
240*71bbb78bSMatthias Springer     // Allocate memory.
241*71bbb78bSMatthias Springer     Location loc = op->getLoc();
242*71bbb78bSMatthias Springer     MemRefType memrefType =
243*71bbb78bSMatthias Springer         getContiguousMemRefType(generateOp.getType().cast<RankedTensorType>());
244*71bbb78bSMatthias Springer     FailureOr<Value> maybeResult =
245*71bbb78bSMatthias Springer         createAlloc(rewriter, loc, memrefType, generateOp.dynamicExtents(),
246*71bbb78bSMatthias Springer                     /*deallocMemref=*/state.getOptions().createDeallocs,
247*71bbb78bSMatthias Springer                     state.getOptions());
248*71bbb78bSMatthias Springer     if (failed(maybeResult))
249*71bbb78bSMatthias Springer       return failure();
250*71bbb78bSMatthias Springer     Value result = *maybeResult;
251*71bbb78bSMatthias Springer 
252*71bbb78bSMatthias Springer     // Collect loop bounds.
253*71bbb78bSMatthias Springer     int64_t rank = memrefType.getRank();
254*71bbb78bSMatthias Springer     Value zero = rewriter.create<arith::ConstantIndexOp>(loc, 0);
255*71bbb78bSMatthias Springer     Value one = rewriter.create<arith::ConstantIndexOp>(loc, 1);
256*71bbb78bSMatthias Springer     SmallVector<Value, 4> lowerBounds(rank, zero);
257*71bbb78bSMatthias Springer     SmallVector<Value, 4> steps(rank, one);
258*71bbb78bSMatthias Springer     SmallVector<Value, 4> upperBounds;
259*71bbb78bSMatthias Springer     int nextDynamicIndex = 0;
260*71bbb78bSMatthias Springer     for (int i = 0; i < rank; i++) {
261*71bbb78bSMatthias Springer       Value upperBound = memrefType.isDynamicDim(i)
262*71bbb78bSMatthias Springer                              ? generateOp.dynamicExtents()[nextDynamicIndex++]
263*71bbb78bSMatthias Springer                              : rewriter.create<arith::ConstantIndexOp>(
264*71bbb78bSMatthias Springer                                    loc, memrefType.getDimSize(i));
265*71bbb78bSMatthias Springer       upperBounds.push_back(upperBound);
266*71bbb78bSMatthias Springer     }
267*71bbb78bSMatthias Springer 
268*71bbb78bSMatthias Springer     // Generate tensor elements with a parallel loop that stores into
269*71bbb78bSMatthias Springer     // each element of the resulting memref. We use mergeBlockBefore to "move"
270*71bbb78bSMatthias Springer     // this op's body into the scf.parallel's body.
271*71bbb78bSMatthias Springer     auto parallel =
272*71bbb78bSMatthias Springer         rewriter.create<scf::ParallelOp>(loc, lowerBounds, upperBounds, steps);
273*71bbb78bSMatthias Springer     Block *parallelBody = parallel.getBody();
274*71bbb78bSMatthias Springer     rewriter.mergeBlockBefore(generateOp.getBody(),
275*71bbb78bSMatthias Springer                               parallelBody->getTerminator(),
276*71bbb78bSMatthias Springer                               parallelBody->getArguments());
277*71bbb78bSMatthias Springer     // Replace the inlined yield op with a store op. The scf.parallel's builder
278*71bbb78bSMatthias Springer     // already populated an scf.yield at the end, so we don't need to worry
279*71bbb78bSMatthias Springer     // about creating that.
280*71bbb78bSMatthias Springer     Operation *elementYield = parallelBody->getTerminator()->getPrevNode();
281*71bbb78bSMatthias Springer     rewriter.setInsertionPointAfter(elementYield);
282*71bbb78bSMatthias Springer     rewriter.replaceOpWithNewOp<memref::StoreOp>(
283*71bbb78bSMatthias Springer         elementYield, elementYield->getOperands()[0], result,
284*71bbb78bSMatthias Springer         parallelBody->getArguments());
285*71bbb78bSMatthias Springer 
286*71bbb78bSMatthias Springer     replaceOpWithBufferizedValues(rewriter, op, result);
287*71bbb78bSMatthias Springer     return success();
288*71bbb78bSMatthias Springer   }
289*71bbb78bSMatthias Springer };
290*71bbb78bSMatthias Springer 
29149e37000SMatthias Springer /// Bufferization of tensor.insert. Replace with memref.store.
29249e37000SMatthias Springer struct InsertOpInterface
29349e37000SMatthias Springer     : public BufferizableOpInterface::ExternalModel<InsertOpInterface,
29449e37000SMatthias Springer                                                     tensor::InsertOp> {
29549e37000SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
29649e37000SMatthias Springer                               const BufferizationState &state) const {
29749e37000SMatthias Springer     return true;
29849e37000SMatthias Springer   }
29949e37000SMatthias Springer 
30049e37000SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
30149e37000SMatthias Springer                                const BufferizationState &state) const {
30249e37000SMatthias Springer     return true;
30349e37000SMatthias Springer   }
30449e37000SMatthias Springer 
30549e37000SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
30649e37000SMatthias Springer                                const BufferizationState &state) const {
30749e37000SMatthias Springer     assert(&opOperand == &op->getOpOperand(1) /*dest*/ &&
30849e37000SMatthias Springer            "expected dest OpOperand");
30949e37000SMatthias Springer     return op->getOpResult(0);
31049e37000SMatthias Springer   }
31149e37000SMatthias Springer 
31249e37000SMatthias Springer   SmallVector<OpOperand *>
31349e37000SMatthias Springer   getAliasingOpOperand(Operation *op, OpResult opResult,
31449e37000SMatthias Springer                        const BufferizationState &state) const {
31549e37000SMatthias Springer     return {&op->getOpOperand(1) /*dest*/};
31649e37000SMatthias Springer   }
31749e37000SMatthias Springer 
31849e37000SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
31949e37000SMatthias Springer                           const BufferizationState &state) const {
32049e37000SMatthias Springer     auto insertOp = cast<tensor::InsertOp>(op);
32149e37000SMatthias Springer     FailureOr<Value> destMemref =
32249e37000SMatthias Springer         state.getBuffer(rewriter, insertOp->getOpOperand(1) /*dest*/);
32349e37000SMatthias Springer     if (failed(destMemref))
32449e37000SMatthias Springer       return failure();
32549e37000SMatthias Springer     rewriter.create<memref::StoreOp>(insertOp.getLoc(), insertOp.scalar(),
32649e37000SMatthias Springer                                      *destMemref, insertOp.indices());
32749e37000SMatthias Springer     replaceOpWithBufferizedValues(rewriter, op, *destMemref);
32849e37000SMatthias Springer     return success();
32949e37000SMatthias Springer   }
33049e37000SMatthias Springer 
33149e37000SMatthias Springer   BufferRelation bufferRelation(Operation *op, OpResult opResult,
33249e37000SMatthias Springer                                 const BufferizationState &state) const {
33349e37000SMatthias Springer     return BufferRelation::Equivalent;
33449e37000SMatthias Springer   }
33549e37000SMatthias Springer };
33649e37000SMatthias Springer 
33749e37000SMatthias Springer /// Return true if the (ExtractSliceOp, InsertSliceOp) pair match (i.e.
33849e37000SMatthias Springer /// equivalent operand / result and same offset/sizes/strides specification).
33949e37000SMatthias Springer ///
34049e37000SMatthias Springer /// This is one particular type of relationship between ops on tensors that
34149e37000SMatthias Springer /// reduce to an equivalence on buffers. This should be generalized and
34249e37000SMatthias Springer /// exposed as interfaces on the proper types.
34349e37000SMatthias Springer static bool areEquivalentExtractSliceOps(const BufferizationState &state,
34449e37000SMatthias Springer                                          ExtractSliceOp st, InsertSliceOp sti) {
34549e37000SMatthias Springer   if (!st || !sti)
34649e37000SMatthias Springer     return false;
34749e37000SMatthias Springer   if (sti != sti &&
34849e37000SMatthias Springer       !state.areEquivalentBufferizedValues(st.source(), sti.dest()))
34949e37000SMatthias Springer     return false;
35049e37000SMatthias Springer   if (!sameOffsetsSizesAndStrides(st, sti, isEqualConstantIntOrValue))
35149e37000SMatthias Springer     return false;
35249e37000SMatthias Springer   return true;
35349e37000SMatthias Springer }
35449e37000SMatthias Springer 
35549e37000SMatthias Springer /// Return true if `value` is originating from an ExtractSliceOp that matches
35649e37000SMatthias Springer /// the given InsertSliceOp.
35749e37000SMatthias Springer static bool hasMatchingExtractSliceOp(const BufferizationState &state,
35849e37000SMatthias Springer                                       Value value, InsertSliceOp insertOp) {
35949e37000SMatthias Springer   auto condition = [&](Value val) {
36049e37000SMatthias Springer     if (auto extractOp = val.getDefiningOp<ExtractSliceOp>())
36149e37000SMatthias Springer       if (areEquivalentExtractSliceOps(state, extractOp, insertOp))
36249e37000SMatthias Springer         return true;
36349e37000SMatthias Springer     return false;
36449e37000SMatthias Springer   };
36549e37000SMatthias Springer 
36649e37000SMatthias Springer   return llvm::all_of(state.findValueInReverseUseDefChain(value, condition),
36749e37000SMatthias Springer                       condition);
36849e37000SMatthias Springer }
36949e37000SMatthias Springer 
37049e37000SMatthias Springer /// Bufferization of tensor.insert_slice. Replace with a memory copy. Under
37149e37000SMatthias Springer /// certain circumstances, this op can also be a no-op.
37249e37000SMatthias Springer struct InsertSliceOpInterface
37349e37000SMatthias Springer     : public BufferizableOpInterface::ExternalModel<InsertSliceOpInterface,
37449e37000SMatthias Springer                                                     tensor::InsertSliceOp> {
37549e37000SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
37649e37000SMatthias Springer                               const BufferizationState &state) const {
37749e37000SMatthias Springer     return true;
37849e37000SMatthias Springer   }
37949e37000SMatthias Springer 
38049e37000SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
38149e37000SMatthias Springer                                const BufferizationState &state) const {
38249e37000SMatthias Springer     return &opOperand == &op->getOpOperand(1) /*dest*/;
38349e37000SMatthias Springer   }
38449e37000SMatthias Springer 
38549e37000SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
38649e37000SMatthias Springer                                const BufferizationState &state) const {
38749e37000SMatthias Springer     return &opOperand == &op->getOpOperand(1) /*dest*/
38849e37000SMatthias Springer                ? op->getResult(0)
38949e37000SMatthias Springer                : OpResult();
39049e37000SMatthias Springer   }
39149e37000SMatthias Springer 
39249e37000SMatthias Springer   BufferRelation bufferRelation(Operation *op, OpResult opResult,
39349e37000SMatthias Springer                                 const BufferizationState &state) const {
39449e37000SMatthias Springer     return BufferRelation::Equivalent;
39549e37000SMatthias Springer   }
39649e37000SMatthias Springer 
39749e37000SMatthias Springer   bool isNotConflicting(Operation *op, OpOperand *uRead,
39849e37000SMatthias Springer                         OpOperand *uConflictingWrite,
39949e37000SMatthias Springer                         const BufferizationState &state) const {
40049e37000SMatthias Springer     Operation *readingOp = uRead->getOwner();
40149e37000SMatthias Springer     Operation *conflictingWritingOp = uConflictingWrite->getOwner();
40249e37000SMatthias Springer 
40349e37000SMatthias Springer     // Special rules for matching ExtractSliceOp/InsertSliceOp pairs. If
40449e37000SMatthias Springer     // uRead is an InsertSliceOp...
40549e37000SMatthias Springer     if (auto insertSliceOp = dyn_cast<InsertSliceOp>(readingOp)) {
40649e37000SMatthias Springer       // As an example, consider the following IR.
40749e37000SMatthias Springer       //
40849e37000SMatthias Springer       // %0 = tensor.extract_slice %t[%a, %b][%c, %d][1, 1] {inplace = [true] }
40949e37000SMatthias Springer       // %1 = linalg.fill %cst, %0 {inplace= [true] }
41049e37000SMatthias Springer       // %2 = tensor.insert_slice %1 into %t[%a, %b][%c, %d][1, 1]
41149e37000SMatthias Springer       //     {inplace= [true] }
41249e37000SMatthias Springer 
41349e37000SMatthias Springer       // TODO: Use insertSliceOp.getDestOpOperand etc. when available.
41449e37000SMatthias Springer       if (uRead == &insertSliceOp->getOpOperand(1) /*dest*/ &&
41549e37000SMatthias Springer           hasMatchingExtractSliceOp(state, uConflictingWrite->get(),
41649e37000SMatthias Springer                                     insertSliceOp))
41749e37000SMatthias Springer         // Case 1: The main insight is that InsertSliceOp reads only part of
41849e37000SMatthias Springer         // the destination tensor. The overwritten area is not read. If
41949e37000SMatthias Springer         // uConflictingWrite writes into exactly the memory location that is
42049e37000SMatthias Springer         // being read by uRead, this is not a conflict.
42149e37000SMatthias Springer         //
42249e37000SMatthias Springer         // In the above example:
42349e37000SMatthias Springer         // uRead             = OpOperand 1 (%t) of tensor.insert_slice
42449e37000SMatthias Springer         // uConflictingWrite = OpOperand 1 (%0) of linalg.fill
42549e37000SMatthias Springer         //
42649e37000SMatthias Springer         // The read of %t does not conflict with the write of the FillOp
42749e37000SMatthias Springer         // (same aliases!) because the area that the FillOp operates on is
42849e37000SMatthias Springer         // exactly the one that is *not* read via %t.
42949e37000SMatthias Springer         return true;
43049e37000SMatthias Springer 
43149e37000SMatthias Springer       if (uRead == &insertSliceOp->getOpOperand(0) /*source*/ &&
43249e37000SMatthias Springer           uConflictingWrite == &insertSliceOp->getOpOperand(1) /*dest*/ &&
43349e37000SMatthias Springer           hasMatchingExtractSliceOp(state, uRead->get(), insertSliceOp))
43449e37000SMatthias Springer         // Case 2: The read of the source tensor and the write to the dest
43549e37000SMatthias Springer         // tensor via an InsertSliceOp is not a conflict if the read is
43649e37000SMatthias Springer         // reading exactly that part of an equivalent tensor that the
43749e37000SMatthias Springer         // InsertSliceOp is writing.
43849e37000SMatthias Springer         //
43949e37000SMatthias Springer         // In the above example:
44049e37000SMatthias Springer         // uRead             = OpOperand 0 (%1) of tensor.insert_slice
44149e37000SMatthias Springer         // uConflictingWrite = OpOperand 1 (%t) of tensor.insert_slice
44249e37000SMatthias Springer         return true;
44349e37000SMatthias Springer     }
44449e37000SMatthias Springer 
44549e37000SMatthias Springer     // If uConflictingWrite is an InsertSliceOp...
44649e37000SMatthias Springer     if (auto insertSliceOp = dyn_cast<InsertSliceOp>(conflictingWritingOp))
44749e37000SMatthias Springer       // As an example, consider the following IR.
44849e37000SMatthias Springer       //
44949e37000SMatthias Springer       // %0 = tensor.extract_slice %t[%a, %b][%c, %d][1, 1] {inplace = [true] }
45049e37000SMatthias Springer       // %1 = linalg.fill %cst, %0 {inplace= [true] }
45149e37000SMatthias Springer       // %2 = tensor.insert_slice %1 into %t[%a, %b][%c, %d][1, 1]
45249e37000SMatthias Springer       //     {inplace= [true] }
45349e37000SMatthias Springer       // %3 = vector.transfer_read %1, %cst
45449e37000SMatthias Springer       //
45549e37000SMatthias Springer       // In the above example:
45649e37000SMatthias Springer       // uRead             = OpOperand 0 (%1) of vector.transfer_read
45749e37000SMatthias Springer       // uConflictingWrite = OpOperand 1 (%t) of tensor.insert_slice
45849e37000SMatthias Springer       // lastWrite         = %1
45949e37000SMatthias Springer       //
46049e37000SMatthias Springer       // This is not a conflict because the InsertSliceOp overwrites the
46149e37000SMatthias Springer       // memory segment of %1 with the exact same data. (Effectively, there
46249e37000SMatthias Springer       // is no memory write here.)
46349e37000SMatthias Springer       if (uConflictingWrite == &insertSliceOp->getOpOperand(1) /*dest*/ &&
46449e37000SMatthias Springer           state.areEquivalentBufferizedValues(uRead->get(),
46549e37000SMatthias Springer                                               insertSliceOp.source()) &&
46649e37000SMatthias Springer           hasMatchingExtractSliceOp(state, insertSliceOp.source(),
46749e37000SMatthias Springer                                     insertSliceOp))
46849e37000SMatthias Springer         return true;
46949e37000SMatthias Springer 
47049e37000SMatthias Springer     return false;
47149e37000SMatthias Springer   }
47249e37000SMatthias Springer 
47349e37000SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
47449e37000SMatthias Springer                           const BufferizationState &state) const {
47549e37000SMatthias Springer     // insert_slice ops arise from tiling and bufferizing them out-of-place is
47649e37000SMatthias Springer     // generally a deal breaker. When used with loops, this ends up cloning the
47749e37000SMatthias Springer     // whole tensor on every single iteration and is a symptom of a
47849e37000SMatthias Springer     // catastrophically bad scheduling decision.
47949e37000SMatthias Springer     // TODO: be very loud about it or even consider failing the pass.
48049e37000SMatthias Springer     auto insertSliceOp = cast<tensor::InsertSliceOp>(op);
48149e37000SMatthias Springer     Location loc = insertSliceOp.getLoc();
48249e37000SMatthias Springer 
48349e37000SMatthias Springer     // When bufferizing out-of-place, `getResultBuffer` allocates.
48449e37000SMatthias Springer     FailureOr<Value> dstMemref =
48549e37000SMatthias Springer         state.getBuffer(rewriter, insertSliceOp->getOpOperand(1) /*dest*/);
48649e37000SMatthias Springer     if (failed(dstMemref))
48749e37000SMatthias Springer       return failure();
48849e37000SMatthias Springer 
48949e37000SMatthias Springer     // Expand offsets, sizes and strides to the full rank to handle the
49049e37000SMatthias Springer     // rank-reducing case.
49149e37000SMatthias Springer     SmallVector<OpFoldResult> mixedOffsets = insertSliceOp.getMixedOffsets();
49249e37000SMatthias Springer     SmallVector<OpFoldResult> mixedSizes = insertSliceOp.getMixedSizes();
49349e37000SMatthias Springer     SmallVector<OpFoldResult> mixedStrides = insertSliceOp.getMixedStrides();
49449e37000SMatthias Springer     OffsetSizeAndStrideOpInterface::expandToRank(
49549e37000SMatthias Springer         *dstMemref, mixedOffsets, mixedSizes, mixedStrides,
49649e37000SMatthias Springer         [&](Value target, int64_t dim) -> OpFoldResult {
49749e37000SMatthias Springer           auto shapedType = target.getType().cast<ShapedType>();
49849e37000SMatthias Springer           if (shapedType.isDynamicDim(dim))
49949e37000SMatthias Springer             return rewriter.create<memref::DimOp>(loc, target, dim).result();
50049e37000SMatthias Springer           return rewriter.getIndexAttr(shapedType.getDimSize(dim));
50149e37000SMatthias Springer         });
50249e37000SMatthias Springer     // Take a subview of the dst.
50349e37000SMatthias Springer     auto dstMemrefType = dstMemref->getType().cast<MemRefType>();
50449e37000SMatthias Springer     auto subviewMemRefType =
50549e37000SMatthias Springer         memref::SubViewOp::inferRankReducedResultType(
50649e37000SMatthias Springer             insertSliceOp.getSourceType().getRank(), dstMemrefType,
50749e37000SMatthias Springer             mixedOffsets, mixedSizes, mixedStrides)
50849e37000SMatthias Springer             .cast<MemRefType>();
50949e37000SMatthias Springer     Value subView = rewriter.create<memref::SubViewOp>(
51049e37000SMatthias Springer         loc, subviewMemRefType, *dstMemref, mixedOffsets, mixedSizes,
51149e37000SMatthias Springer         mixedStrides);
51249e37000SMatthias Springer 
51349e37000SMatthias Springer     // Copy tensor. If this tensor.insert_slice has a matching
51449e37000SMatthias Springer     // tensor.extract_slice, the copy operation will eventually fold away.
51549e37000SMatthias Springer     Value srcMemref =
51649e37000SMatthias Springer         *state.getBuffer(rewriter, insertSliceOp->getOpOperand(0) /*source*/);
51749e37000SMatthias Springer     if (failed(createMemCpy(rewriter, loc, srcMemref, subView,
51849e37000SMatthias Springer                             state.getOptions())))
51949e37000SMatthias Springer       return failure();
52049e37000SMatthias Springer 
52149e37000SMatthias Springer     replaceOpWithBufferizedValues(rewriter, op, *dstMemref);
52249e37000SMatthias Springer     return success();
52349e37000SMatthias Springer   }
52449e37000SMatthias Springer };
52549e37000SMatthias Springer 
526fc08d1c2SMatthias Springer /// Bufferization of tensor.rank. Replace with memref.rank.
527fc08d1c2SMatthias Springer struct RankOpInterface
528fc08d1c2SMatthias Springer     : public BufferizableOpInterface::ExternalModel<RankOpInterface,
529fc08d1c2SMatthias Springer                                                     tensor::RankOp> {
530fc08d1c2SMatthias Springer   bool bufferizesToMemoryRead(Operation *op, OpOperand &opOperand,
531fc08d1c2SMatthias Springer                               const BufferizationState &state) const {
532fc08d1c2SMatthias Springer     return true;
533fc08d1c2SMatthias Springer   }
534fc08d1c2SMatthias Springer 
535fc08d1c2SMatthias Springer   bool bufferizesToMemoryWrite(Operation *op, OpOperand &opOperand,
536fc08d1c2SMatthias Springer                                const BufferizationState &state) const {
537fc08d1c2SMatthias Springer     return false;
538fc08d1c2SMatthias Springer   }
539fc08d1c2SMatthias Springer 
540fc08d1c2SMatthias Springer   OpResult getAliasingOpResult(Operation *op, OpOperand &opOperand,
541fc08d1c2SMatthias Springer                                const BufferizationState &state) const {
542fc08d1c2SMatthias Springer     return OpResult();
543fc08d1c2SMatthias Springer   }
544fc08d1c2SMatthias Springer 
545fc08d1c2SMatthias Springer   LogicalResult bufferize(Operation *op, RewriterBase &rewriter,
546fc08d1c2SMatthias Springer                           const BufferizationState &state) const {
547fc08d1c2SMatthias Springer     auto rankOp = cast<tensor::RankOp>(op);
548fc08d1c2SMatthias Springer     Value v = *state.getBuffer(rewriter, rankOp->getOpOperand(0) /*source*/);
549fc08d1c2SMatthias Springer     replaceOpWithNewBufferizedOp<memref::RankOp>(rewriter, op, rankOp.getType(),
550fc08d1c2SMatthias Springer                                                  v);
551fc08d1c2SMatthias Springer     return success();
552fc08d1c2SMatthias Springer   }
553fc08d1c2SMatthias Springer };
554fc08d1c2SMatthias Springer 
55549e37000SMatthias Springer } // namespace
55649e37000SMatthias Springer } // namespace tensor
55749e37000SMatthias Springer } // namespace mlir
55849e37000SMatthias Springer 
55949e37000SMatthias Springer void mlir::tensor::registerBufferizableOpInterfaceExternalModels(
56049e37000SMatthias Springer     DialectRegistry &registry) {
56149e37000SMatthias Springer   registry.addOpInterface<CastOp, CastOpInterface>();
56249e37000SMatthias Springer   registry.addOpInterface<DimOp, DimOpInterface>();
56349e37000SMatthias Springer   registry.addOpInterface<ExtractSliceOp, ExtractSliceOpInterface>();
56449e37000SMatthias Springer   registry.addOpInterface<ExtractOp, ExtractOpInterface>();
565*71bbb78bSMatthias Springer   registry.addOpInterface<GenerateOp, GenerateOpInterface>();
56649e37000SMatthias Springer   registry.addOpInterface<InsertOp, InsertOpInterface>();
56749e37000SMatthias Springer   registry.addOpInterface<InsertSliceOp, InsertSliceOpInterface>();
568fc08d1c2SMatthias Springer   registry.addOpInterface<RankOp, RankOpInterface>();
56949e37000SMatthias Springer }
570