15c0c51a9SNicolas Vasilache //===- VectorToLLVM.cpp - Conversion from Vector to the LLVM dialect ------===//
25c0c51a9SNicolas Vasilache //
330857107SMehdi Amini // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
456222a06SMehdi Amini // See https://llvm.org/LICENSE.txt for license information.
556222a06SMehdi Amini // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
65c0c51a9SNicolas Vasilache //
756222a06SMehdi Amini //===----------------------------------------------------------------------===//
85c0c51a9SNicolas Vasilache 
965678d93SNicolas Vasilache #include "mlir/Conversion/VectorToLLVM/ConvertVectorToLLVM.h"
10870c1fd4SAlex Zinenko 
1175e5f0aaSAlex Zinenko #include "mlir/Conversion/LLVMCommon/VectorPattern.h"
12a54f4eaeSMogball #include "mlir/Dialect/Arithmetic/IR/Arithmetic.h"
13a75a46dbSJavier Setoain #include "mlir/Dialect/Arithmetic/Utils/Utils.h"
14e332c22cSNicolas Vasilache #include "mlir/Dialect/LLVMIR/FunctionCallUtils.h"
155c0c51a9SNicolas Vasilache #include "mlir/Dialect/LLVMIR/LLVMDialect.h"
16e2310704SJulian Gross #include "mlir/Dialect/MemRef/IR/MemRef.h"
1799ef9eebSMatthias Springer #include "mlir/Dialect/Vector/Transforms/VectorTransforms.h"
1809f7a55fSRiver Riddle #include "mlir/IR/BuiltinTypes.h"
198fe076ffSThomas Raoux #include "mlir/IR/TypeUtilities.h"
2029a50c58SStephen Neuendorffer #include "mlir/Support/MathExtras.h"
21929189a4SWilliam S. Moses #include "mlir/Target/LLVMIR/TypeToLLVM.h"
225c0c51a9SNicolas Vasilache #include "mlir/Transforms/DialectConversion.h"
235c0c51a9SNicolas Vasilache 
245c0c51a9SNicolas Vasilache using namespace mlir;
2565678d93SNicolas Vasilache using namespace mlir::vector;
265c0c51a9SNicolas Vasilache 
279826fe5cSAart Bik // Helper to reduce vector type by one rank at front.
reducedVectorTypeFront(VectorType tp)289826fe5cSAart Bik static VectorType reducedVectorTypeFront(VectorType tp) {
299826fe5cSAart Bik   assert((tp.getRank() > 1) && "unlowerable vector type");
30a4830d14SJavier Setoain   unsigned numScalableDims = tp.getNumScalableDims();
31a4830d14SJavier Setoain   if (tp.getShape().size() == numScalableDims)
32a4830d14SJavier Setoain     --numScalableDims;
33a4830d14SJavier Setoain   return VectorType::get(tp.getShape().drop_front(), tp.getElementType(),
34a4830d14SJavier Setoain                          numScalableDims);
359826fe5cSAart Bik }
369826fe5cSAart Bik 
379826fe5cSAart Bik // Helper to reduce vector type by *all* but one rank at back.
reducedVectorTypeBack(VectorType tp)389826fe5cSAart Bik static VectorType reducedVectorTypeBack(VectorType tp) {
399826fe5cSAart Bik   assert((tp.getRank() > 1) && "unlowerable vector type");
40a4830d14SJavier Setoain   unsigned numScalableDims = tp.getNumScalableDims();
41a4830d14SJavier Setoain   if (numScalableDims > 0)
42a4830d14SJavier Setoain     --numScalableDims;
43a4830d14SJavier Setoain   return VectorType::get(tp.getShape().take_back(), tp.getElementType(),
44a4830d14SJavier Setoain                          numScalableDims);
459826fe5cSAart Bik }
469826fe5cSAart Bik 
471c81adf3SAart Bik // Helper that picks the proper sequence for inserting.
insertOne(ConversionPatternRewriter & rewriter,LLVMTypeConverter & typeConverter,Location loc,Value val1,Value val2,Type llvmType,int64_t rank,int64_t pos)48e62a6956SRiver Riddle static Value insertOne(ConversionPatternRewriter &rewriter,
490f04384dSAlex Zinenko                        LLVMTypeConverter &typeConverter, Location loc,
500f04384dSAlex Zinenko                        Value val1, Value val2, Type llvmType, int64_t rank,
510f04384dSAlex Zinenko                        int64_t pos) {
52e7026abaSNicolas Vasilache   assert(rank > 0 && "0-D vector corner case should have been handled already");
531c81adf3SAart Bik   if (rank == 1) {
541c81adf3SAart Bik     auto idxType = rewriter.getIndexType();
551c81adf3SAart Bik     auto constant = rewriter.create<LLVM::ConstantOp>(
560f04384dSAlex Zinenko         loc, typeConverter.convertType(idxType),
571c81adf3SAart Bik         rewriter.getIntegerAttr(idxType, pos));
581c81adf3SAart Bik     return rewriter.create<LLVM::InsertElementOp>(loc, llvmType, val1, val2,
591c81adf3SAart Bik                                                   constant);
601c81adf3SAart Bik   }
611c81adf3SAart Bik   return rewriter.create<LLVM::InsertValueOp>(loc, llvmType, val1, val2,
621c81adf3SAart Bik                                               rewriter.getI64ArrayAttr(pos));
631c81adf3SAart Bik }
641c81adf3SAart Bik 
651c81adf3SAart Bik // Helper that picks the proper sequence for extracting.
extractOne(ConversionPatternRewriter & rewriter,LLVMTypeConverter & typeConverter,Location loc,Value val,Type llvmType,int64_t rank,int64_t pos)66e62a6956SRiver Riddle static Value extractOne(ConversionPatternRewriter &rewriter,
670f04384dSAlex Zinenko                         LLVMTypeConverter &typeConverter, Location loc,
680f04384dSAlex Zinenko                         Value val, Type llvmType, int64_t rank, int64_t pos) {
69cc311a15SMichal Terepeta   if (rank <= 1) {
701c81adf3SAart Bik     auto idxType = rewriter.getIndexType();
711c81adf3SAart Bik     auto constant = rewriter.create<LLVM::ConstantOp>(
720f04384dSAlex Zinenko         loc, typeConverter.convertType(idxType),
731c81adf3SAart Bik         rewriter.getIntegerAttr(idxType, pos));
741c81adf3SAart Bik     return rewriter.create<LLVM::ExtractElementOp>(loc, llvmType, val,
751c81adf3SAart Bik                                                    constant);
761c81adf3SAart Bik   }
771c81adf3SAart Bik   return rewriter.create<LLVM::ExtractValueOp>(loc, llvmType, val,
781c81adf3SAart Bik                                                rewriter.getI64ArrayAttr(pos));
791c81adf3SAart Bik }
801c81adf3SAart Bik 
8126c8f908SThomas Raoux // Helper that returns data layout alignment of a memref.
getMemRefAlignment(LLVMTypeConverter & typeConverter,MemRefType memrefType,unsigned & align)8226c8f908SThomas Raoux LogicalResult getMemRefAlignment(LLVMTypeConverter &typeConverter,
8326c8f908SThomas Raoux                                  MemRefType memrefType, unsigned &align) {
8426c8f908SThomas Raoux   Type elementTy = typeConverter.convertType(memrefType.getElementType());
855f9e0466SNicolas Vasilache   if (!elementTy)
865f9e0466SNicolas Vasilache     return failure();
875f9e0466SNicolas Vasilache 
88b2ab375dSAlex Zinenko   // TODO: this should use the MLIR data layout when it becomes available and
89b2ab375dSAlex Zinenko   // stop depending on translation.
9087a89e0fSAlex Zinenko   llvm::LLVMContext llvmContext;
9187a89e0fSAlex Zinenko   align = LLVM::TypeToLLVMIRTranslator(llvmContext)
92c69c9e0fSAlex Zinenko               .getPreferredAlignment(elementTy, typeConverter.getDataLayout());
935f9e0466SNicolas Vasilache   return success();
945f9e0466SNicolas Vasilache }
955f9e0466SNicolas Vasilache 
96df5ccf5aSAart Bik // Add an index vector component to a base pointer. This almost always succeeds
97df5ccf5aSAart Bik // unless the last stride is non-unit or the memory space is not zero.
getIndexedPtrs(ConversionPatternRewriter & rewriter,Location loc,Value memref,Value base,Value index,MemRefType memRefType,VectorType vType,Value & ptrs)98df5ccf5aSAart Bik static LogicalResult getIndexedPtrs(ConversionPatternRewriter &rewriter,
99df5ccf5aSAart Bik                                     Location loc, Value memref, Value base,
100df5ccf5aSAart Bik                                     Value index, MemRefType memRefType,
101df5ccf5aSAart Bik                                     VectorType vType, Value &ptrs) {
10219dbb230Saartbik   int64_t offset;
10319dbb230Saartbik   SmallVector<int64_t, 4> strides;
10419dbb230Saartbik   auto successStrides = getStridesAndOffset(memRefType, strides, offset);
105df5ccf5aSAart Bik   if (failed(successStrides) || strides.back() != 1 ||
10637eca08eSVladislav Vinogradov       memRefType.getMemorySpaceAsInt() != 0)
107e8dcf5f8Saartbik     return failure();
1083a577f54SChristian Sigg   auto pType = MemRefDescriptor(memref).getElementPtrType();
109bd30a796SAlex Zinenko   auto ptrsType = LLVM::getFixedVectorType(pType, vType.getDimSize(0));
110df5ccf5aSAart Bik   ptrs = rewriter.create<LLVM::GEPOp>(loc, ptrsType, base, index);
11119dbb230Saartbik   return success();
11219dbb230Saartbik }
11319dbb230Saartbik 
114a57def30SAart Bik // Casts a strided element pointer to a vector pointer.  The vector pointer
11508c681f6SAndrew Pritchard // will be in the same address space as the incoming memref type.
castDataPtr(ConversionPatternRewriter & rewriter,Location loc,Value ptr,MemRefType memRefType,Type vt)116a57def30SAart Bik static Value castDataPtr(ConversionPatternRewriter &rewriter, Location loc,
117a57def30SAart Bik                          Value ptr, MemRefType memRefType, Type vt) {
11837eca08eSVladislav Vinogradov   auto pType = LLVM::LLVMPointerType::get(vt, memRefType.getMemorySpaceAsInt());
119a57def30SAart Bik   return rewriter.create<LLVM::BitcastOp>(loc, pType, ptr);
120a57def30SAart Bik }
121a57def30SAart Bik 
12290c01357SBenjamin Kramer namespace {
123e83b7b99Saartbik 
124a4830d14SJavier Setoain /// Trivial Vector to LLVM conversions
125a4830d14SJavier Setoain using VectorScaleOpConversion =
126a4830d14SJavier Setoain     OneToOneConvertToLLVMPattern<vector::VectorScaleOp, LLVM::vscale>;
127a4830d14SJavier Setoain 
128cf5c517cSDiego Caballero /// Conversion pattern for a vector.bitcast.
129cf5c517cSDiego Caballero class VectorBitCastOpConversion
130cf5c517cSDiego Caballero     : public ConvertOpToLLVMPattern<vector::BitCastOp> {
131cf5c517cSDiego Caballero public:
132cf5c517cSDiego Caballero   using ConvertOpToLLVMPattern<vector::BitCastOp>::ConvertOpToLLVMPattern;
133cf5c517cSDiego Caballero 
134cf5c517cSDiego Caballero   LogicalResult
matchAndRewrite(vector::BitCastOp bitCastOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const135ef976337SRiver Riddle   matchAndRewrite(vector::BitCastOp bitCastOp, OpAdaptor adaptor,
136cf5c517cSDiego Caballero                   ConversionPatternRewriter &rewriter) const override {
1371423e8bfSMichal Terepeta     // Only 0-D and 1-D vectors can be lowered to LLVM.
1381423e8bfSMichal Terepeta     VectorType resultTy = bitCastOp.getResultVectorType();
1391423e8bfSMichal Terepeta     if (resultTy.getRank() > 1)
140cf5c517cSDiego Caballero       return failure();
141cf5c517cSDiego Caballero     Type newResultTy = typeConverter->convertType(resultTy);
142cf5c517cSDiego Caballero     rewriter.replaceOpWithNewOp<LLVM::BitcastOp>(bitCastOp, newResultTy,
143ef976337SRiver Riddle                                                  adaptor.getOperands()[0]);
144cf5c517cSDiego Caballero     return success();
145cf5c517cSDiego Caballero   }
146cf5c517cSDiego Caballero };
147cf5c517cSDiego Caballero 
14863b683a8SNicolas Vasilache /// Conversion pattern for a vector.matrix_multiply.
14963b683a8SNicolas Vasilache /// This is lowered directly to the proper llvm.intr.matrix.multiply.
150563879b6SRahul Joshi class VectorMatmulOpConversion
151563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::MatmulOp> {
15263b683a8SNicolas Vasilache public:
153563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::MatmulOp>::ConvertOpToLLVMPattern;
15463b683a8SNicolas Vasilache 
1553145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::MatmulOp matmulOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const156ef976337SRiver Riddle   matchAndRewrite(vector::MatmulOp matmulOp, OpAdaptor adaptor,
15763b683a8SNicolas Vasilache                   ConversionPatternRewriter &rewriter) const override {
15863b683a8SNicolas Vasilache     rewriter.replaceOpWithNewOp<LLVM::MatrixMultiplyOp>(
1597c38fd60SJacques Pienaar         matmulOp, typeConverter->convertType(matmulOp.getRes().getType()),
1607c38fd60SJacques Pienaar         adaptor.getLhs(), adaptor.getRhs(), matmulOp.getLhsRows(),
1617c38fd60SJacques Pienaar         matmulOp.getLhsColumns(), matmulOp.getRhsColumns());
1623145427dSRiver Riddle     return success();
16363b683a8SNicolas Vasilache   }
16463b683a8SNicolas Vasilache };
16563b683a8SNicolas Vasilache 
166c295a65dSaartbik /// Conversion pattern for a vector.flat_transpose.
167c295a65dSaartbik /// This is lowered directly to the proper llvm.intr.matrix.transpose.
168563879b6SRahul Joshi class VectorFlatTransposeOpConversion
169563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::FlatTransposeOp> {
170c295a65dSaartbik public:
171563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::FlatTransposeOp>::ConvertOpToLLVMPattern;
172c295a65dSaartbik 
173c295a65dSaartbik   LogicalResult
matchAndRewrite(vector::FlatTransposeOp transOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const174ef976337SRiver Riddle   matchAndRewrite(vector::FlatTransposeOp transOp, OpAdaptor adaptor,
175c295a65dSaartbik                   ConversionPatternRewriter &rewriter) const override {
176c295a65dSaartbik     rewriter.replaceOpWithNewOp<LLVM::MatrixTransposeOp>(
1777c38fd60SJacques Pienaar         transOp, typeConverter->convertType(transOp.getRes().getType()),
1787c38fd60SJacques Pienaar         adaptor.getMatrix(), transOp.getRows(), transOp.getColumns());
179c295a65dSaartbik     return success();
180c295a65dSaartbik   }
181c295a65dSaartbik };
182c295a65dSaartbik 
183ee66e43aSDiego Caballero /// Overloaded utility that replaces a vector.load, vector.store,
184ee66e43aSDiego Caballero /// vector.maskedload and vector.maskedstore with their respective LLVM
185ee66e43aSDiego Caballero /// couterparts.
replaceLoadOrStoreOp(vector::LoadOp loadOp,vector::LoadOpAdaptor adaptor,VectorType vectorTy,Value ptr,unsigned align,ConversionPatternRewriter & rewriter)186ee66e43aSDiego Caballero static void replaceLoadOrStoreOp(vector::LoadOp loadOp,
187ee66e43aSDiego Caballero                                  vector::LoadOpAdaptor adaptor,
188ee66e43aSDiego Caballero                                  VectorType vectorTy, Value ptr, unsigned align,
189ee66e43aSDiego Caballero                                  ConversionPatternRewriter &rewriter) {
190ee66e43aSDiego Caballero   rewriter.replaceOpWithNewOp<LLVM::LoadOp>(loadOp, ptr, align);
19139379916Saartbik }
19239379916Saartbik 
replaceLoadOrStoreOp(vector::MaskedLoadOp loadOp,vector::MaskedLoadOpAdaptor adaptor,VectorType vectorTy,Value ptr,unsigned align,ConversionPatternRewriter & rewriter)193ee66e43aSDiego Caballero static void replaceLoadOrStoreOp(vector::MaskedLoadOp loadOp,
194ee66e43aSDiego Caballero                                  vector::MaskedLoadOpAdaptor adaptor,
195ee66e43aSDiego Caballero                                  VectorType vectorTy, Value ptr, unsigned align,
196ee66e43aSDiego Caballero                                  ConversionPatternRewriter &rewriter) {
197ee66e43aSDiego Caballero   rewriter.replaceOpWithNewOp<LLVM::MaskedLoadOp>(
1987c38fd60SJacques Pienaar       loadOp, vectorTy, ptr, adaptor.getMask(), adaptor.getPassThru(), align);
199ee66e43aSDiego Caballero }
200ee66e43aSDiego Caballero 
replaceLoadOrStoreOp(vector::StoreOp storeOp,vector::StoreOpAdaptor adaptor,VectorType vectorTy,Value ptr,unsigned align,ConversionPatternRewriter & rewriter)201ee66e43aSDiego Caballero static void replaceLoadOrStoreOp(vector::StoreOp storeOp,
202ee66e43aSDiego Caballero                                  vector::StoreOpAdaptor adaptor,
203ee66e43aSDiego Caballero                                  VectorType vectorTy, Value ptr, unsigned align,
204ee66e43aSDiego Caballero                                  ConversionPatternRewriter &rewriter) {
2057c38fd60SJacques Pienaar   rewriter.replaceOpWithNewOp<LLVM::StoreOp>(storeOp, adaptor.getValueToStore(),
206ee66e43aSDiego Caballero                                              ptr, align);
207ee66e43aSDiego Caballero }
208ee66e43aSDiego Caballero 
replaceLoadOrStoreOp(vector::MaskedStoreOp storeOp,vector::MaskedStoreOpAdaptor adaptor,VectorType vectorTy,Value ptr,unsigned align,ConversionPatternRewriter & rewriter)209ee66e43aSDiego Caballero static void replaceLoadOrStoreOp(vector::MaskedStoreOp storeOp,
210ee66e43aSDiego Caballero                                  vector::MaskedStoreOpAdaptor adaptor,
211ee66e43aSDiego Caballero                                  VectorType vectorTy, Value ptr, unsigned align,
212ee66e43aSDiego Caballero                                  ConversionPatternRewriter &rewriter) {
213ee66e43aSDiego Caballero   rewriter.replaceOpWithNewOp<LLVM::MaskedStoreOp>(
2147c38fd60SJacques Pienaar       storeOp, adaptor.getValueToStore(), ptr, adaptor.getMask(), align);
215ee66e43aSDiego Caballero }
216ee66e43aSDiego Caballero 
217ee66e43aSDiego Caballero /// Conversion pattern for a vector.load, vector.store, vector.maskedload, and
218ee66e43aSDiego Caballero /// vector.maskedstore.
219ee66e43aSDiego Caballero template <class LoadOrStoreOp, class LoadOrStoreOpAdaptor>
220ee66e43aSDiego Caballero class VectorLoadStoreConversion : public ConvertOpToLLVMPattern<LoadOrStoreOp> {
22139379916Saartbik public:
222ee66e43aSDiego Caballero   using ConvertOpToLLVMPattern<LoadOrStoreOp>::ConvertOpToLLVMPattern;
22339379916Saartbik 
22439379916Saartbik   LogicalResult
matchAndRewrite(LoadOrStoreOp loadOrStoreOp,typename LoadOrStoreOp::Adaptor adaptor,ConversionPatternRewriter & rewriter) const225ef976337SRiver Riddle   matchAndRewrite(LoadOrStoreOp loadOrStoreOp,
226ef976337SRiver Riddle                   typename LoadOrStoreOp::Adaptor adaptor,
22739379916Saartbik                   ConversionPatternRewriter &rewriter) const override {
228ee66e43aSDiego Caballero     // Only 1-D vectors can be lowered to LLVM.
229ee66e43aSDiego Caballero     VectorType vectorTy = loadOrStoreOp.getVectorType();
230ee66e43aSDiego Caballero     if (vectorTy.getRank() > 1)
231ee66e43aSDiego Caballero       return failure();
232ee66e43aSDiego Caballero 
233ee66e43aSDiego Caballero     auto loc = loadOrStoreOp->getLoc();
234ee66e43aSDiego Caballero     MemRefType memRefTy = loadOrStoreOp.getMemRefType();
23539379916Saartbik 
23639379916Saartbik     // Resolve alignment.
23739379916Saartbik     unsigned align;
23873863648SStephen Neuendorffer     if (failed(getMemRefAlignment(*this->getTypeConverter(), memRefTy, align)))
23939379916Saartbik       return failure();
24039379916Saartbik 
241a57def30SAart Bik     // Resolve address.
242ee66e43aSDiego Caballero     auto vtype = this->typeConverter->convertType(loadOrStoreOp.getVectorType())
243ee66e43aSDiego Caballero                      .template cast<VectorType>();
2447c38fd60SJacques Pienaar     Value dataPtr = this->getStridedElementPtr(loc, memRefTy, adaptor.getBase(),
2457c38fd60SJacques Pienaar                                                adaptor.getIndices(), rewriter);
246ee66e43aSDiego Caballero     Value ptr = castDataPtr(rewriter, loc, dataPtr, memRefTy, vtype);
24739379916Saartbik 
248ee66e43aSDiego Caballero     replaceLoadOrStoreOp(loadOrStoreOp, adaptor, vtype, ptr, align, rewriter);
24939379916Saartbik     return success();
25039379916Saartbik   }
25139379916Saartbik };
25239379916Saartbik 
25319dbb230Saartbik /// Conversion pattern for a vector.gather.
254563879b6SRahul Joshi class VectorGatherOpConversion
255563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::GatherOp> {
25619dbb230Saartbik public:
257563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::GatherOp>::ConvertOpToLLVMPattern;
25819dbb230Saartbik 
25919dbb230Saartbik   LogicalResult
matchAndRewrite(vector::GatherOp gather,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const260ef976337SRiver Riddle   matchAndRewrite(vector::GatherOp gather, OpAdaptor adaptor,
26119dbb230Saartbik                   ConversionPatternRewriter &rewriter) const override {
262563879b6SRahul Joshi     auto loc = gather->getLoc();
263df5ccf5aSAart Bik     MemRefType memRefType = gather.getMemRefType();
26419dbb230Saartbik 
26519dbb230Saartbik     // Resolve alignment.
26619dbb230Saartbik     unsigned align;
26773863648SStephen Neuendorffer     if (failed(getMemRefAlignment(*getTypeConverter(), memRefType, align)))
26819dbb230Saartbik       return failure();
26919dbb230Saartbik 
270df5ccf5aSAart Bik     // Resolve address.
27119dbb230Saartbik     Value ptrs;
272df5ccf5aSAart Bik     VectorType vType = gather.getVectorType();
2737c38fd60SJacques Pienaar     Value ptr = getStridedElementPtr(loc, memRefType, adaptor.getBase(),
2747c38fd60SJacques Pienaar                                      adaptor.getIndices(), rewriter);
2757c38fd60SJacques Pienaar     if (failed(getIndexedPtrs(rewriter, loc, adaptor.getBase(), ptr,
2767c38fd60SJacques Pienaar                               adaptor.getIndexVec(), memRefType, vType, ptrs)))
27719dbb230Saartbik       return failure();
27819dbb230Saartbik 
27919dbb230Saartbik     // Replace with the gather intrinsic.
28019dbb230Saartbik     rewriter.replaceOpWithNewOp<LLVM::masked_gather>(
2817c38fd60SJacques Pienaar         gather, typeConverter->convertType(vType), ptrs, adaptor.getMask(),
2827c38fd60SJacques Pienaar         adaptor.getPassThru(), rewriter.getI32IntegerAttr(align));
28319dbb230Saartbik     return success();
28419dbb230Saartbik   }
28519dbb230Saartbik };
28619dbb230Saartbik 
28719dbb230Saartbik /// Conversion pattern for a vector.scatter.
288563879b6SRahul Joshi class VectorScatterOpConversion
289563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::ScatterOp> {
29019dbb230Saartbik public:
291563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::ScatterOp>::ConvertOpToLLVMPattern;
29219dbb230Saartbik 
29319dbb230Saartbik   LogicalResult
matchAndRewrite(vector::ScatterOp scatter,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const294ef976337SRiver Riddle   matchAndRewrite(vector::ScatterOp scatter, OpAdaptor adaptor,
29519dbb230Saartbik                   ConversionPatternRewriter &rewriter) const override {
296563879b6SRahul Joshi     auto loc = scatter->getLoc();
297df5ccf5aSAart Bik     MemRefType memRefType = scatter.getMemRefType();
29819dbb230Saartbik 
29919dbb230Saartbik     // Resolve alignment.
30019dbb230Saartbik     unsigned align;
30173863648SStephen Neuendorffer     if (failed(getMemRefAlignment(*getTypeConverter(), memRefType, align)))
30219dbb230Saartbik       return failure();
30319dbb230Saartbik 
304df5ccf5aSAart Bik     // Resolve address.
30519dbb230Saartbik     Value ptrs;
306df5ccf5aSAart Bik     VectorType vType = scatter.getVectorType();
3077c38fd60SJacques Pienaar     Value ptr = getStridedElementPtr(loc, memRefType, adaptor.getBase(),
3087c38fd60SJacques Pienaar                                      adaptor.getIndices(), rewriter);
3097c38fd60SJacques Pienaar     if (failed(getIndexedPtrs(rewriter, loc, adaptor.getBase(), ptr,
3107c38fd60SJacques Pienaar                               adaptor.getIndexVec(), memRefType, vType, ptrs)))
31119dbb230Saartbik       return failure();
31219dbb230Saartbik 
31319dbb230Saartbik     // Replace with the scatter intrinsic.
31419dbb230Saartbik     rewriter.replaceOpWithNewOp<LLVM::masked_scatter>(
3157c38fd60SJacques Pienaar         scatter, adaptor.getValueToStore(), ptrs, adaptor.getMask(),
31619dbb230Saartbik         rewriter.getI32IntegerAttr(align));
31719dbb230Saartbik     return success();
31819dbb230Saartbik   }
31919dbb230Saartbik };
32019dbb230Saartbik 
321e8dcf5f8Saartbik /// Conversion pattern for a vector.expandload.
322563879b6SRahul Joshi class VectorExpandLoadOpConversion
323563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::ExpandLoadOp> {
324e8dcf5f8Saartbik public:
325563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::ExpandLoadOp>::ConvertOpToLLVMPattern;
326e8dcf5f8Saartbik 
327e8dcf5f8Saartbik   LogicalResult
matchAndRewrite(vector::ExpandLoadOp expand,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const328ef976337SRiver Riddle   matchAndRewrite(vector::ExpandLoadOp expand, OpAdaptor adaptor,
329e8dcf5f8Saartbik                   ConversionPatternRewriter &rewriter) const override {
330563879b6SRahul Joshi     auto loc = expand->getLoc();
331a57def30SAart Bik     MemRefType memRefType = expand.getMemRefType();
332e8dcf5f8Saartbik 
333a57def30SAart Bik     // Resolve address.
334656674a7SDiego Caballero     auto vtype = typeConverter->convertType(expand.getVectorType());
3357c38fd60SJacques Pienaar     Value ptr = getStridedElementPtr(loc, memRefType, adaptor.getBase(),
3367c38fd60SJacques Pienaar                                      adaptor.getIndices(), rewriter);
337e8dcf5f8Saartbik 
338e8dcf5f8Saartbik     rewriter.replaceOpWithNewOp<LLVM::masked_expandload>(
3397c38fd60SJacques Pienaar         expand, vtype, ptr, adaptor.getMask(), adaptor.getPassThru());
340e8dcf5f8Saartbik     return success();
341e8dcf5f8Saartbik   }
342e8dcf5f8Saartbik };
343e8dcf5f8Saartbik 
344e8dcf5f8Saartbik /// Conversion pattern for a vector.compressstore.
345563879b6SRahul Joshi class VectorCompressStoreOpConversion
346563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::CompressStoreOp> {
347e8dcf5f8Saartbik public:
348563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::CompressStoreOp>::ConvertOpToLLVMPattern;
349e8dcf5f8Saartbik 
350e8dcf5f8Saartbik   LogicalResult
matchAndRewrite(vector::CompressStoreOp compress,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const351ef976337SRiver Riddle   matchAndRewrite(vector::CompressStoreOp compress, OpAdaptor adaptor,
352e8dcf5f8Saartbik                   ConversionPatternRewriter &rewriter) const override {
353563879b6SRahul Joshi     auto loc = compress->getLoc();
354a57def30SAart Bik     MemRefType memRefType = compress.getMemRefType();
355e8dcf5f8Saartbik 
356a57def30SAart Bik     // Resolve address.
3577c38fd60SJacques Pienaar     Value ptr = getStridedElementPtr(loc, memRefType, adaptor.getBase(),
3587c38fd60SJacques Pienaar                                      adaptor.getIndices(), rewriter);
359e8dcf5f8Saartbik 
360e8dcf5f8Saartbik     rewriter.replaceOpWithNewOp<LLVM::masked_compressstore>(
3617c38fd60SJacques Pienaar         compress, adaptor.getValueToStore(), ptr, adaptor.getMask());
362e8dcf5f8Saartbik     return success();
363e8dcf5f8Saartbik   }
364e8dcf5f8Saartbik };
365e8dcf5f8Saartbik 
366fa596c69SMahesh Ravishankar /// Helper method to lower a `vector.reduction` op that performs an arithmetic
367fa596c69SMahesh Ravishankar /// operation like add,mul, etc.. `VectorOp` is the LLVM vector intrinsic to use
368fa596c69SMahesh Ravishankar /// and `ScalarOp` is the scalar operation used to add the accumulation value if
369fa596c69SMahesh Ravishankar /// non-null.
370fa596c69SMahesh Ravishankar template <class VectorOp, class ScalarOp>
createIntegerReductionArithmeticOpLowering(ConversionPatternRewriter & rewriter,Location loc,Type llvmType,Value vectorOperand,Value accumulator)371fa596c69SMahesh Ravishankar static Value createIntegerReductionArithmeticOpLowering(
372fa596c69SMahesh Ravishankar     ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
373fa596c69SMahesh Ravishankar     Value vectorOperand, Value accumulator) {
374fa596c69SMahesh Ravishankar   Value result = rewriter.create<VectorOp>(loc, llvmType, vectorOperand);
375fa596c69SMahesh Ravishankar   if (accumulator)
376fa596c69SMahesh Ravishankar     result = rewriter.create<ScalarOp>(loc, accumulator, result);
377fa596c69SMahesh Ravishankar   return result;
378fa596c69SMahesh Ravishankar }
379fa596c69SMahesh Ravishankar 
380fa596c69SMahesh Ravishankar /// Helper method to lower a `vector.reduction` operation that performs
381fa596c69SMahesh Ravishankar /// a comparison operation like `min`/`max`. `VectorOp` is the LLVM vector
382fa596c69SMahesh Ravishankar /// intrinsic to use and `predicate` is the predicate to use to compare+combine
383fa596c69SMahesh Ravishankar /// the accumulator value if non-null.
384fa596c69SMahesh Ravishankar template <class VectorOp>
createIntegerReductionComparisonOpLowering(ConversionPatternRewriter & rewriter,Location loc,Type llvmType,Value vectorOperand,Value accumulator,LLVM::ICmpPredicate predicate)385fa596c69SMahesh Ravishankar static Value createIntegerReductionComparisonOpLowering(
386fa596c69SMahesh Ravishankar     ConversionPatternRewriter &rewriter, Location loc, Type llvmType,
387fa596c69SMahesh Ravishankar     Value vectorOperand, Value accumulator, LLVM::ICmpPredicate predicate) {
388fa596c69SMahesh Ravishankar   Value result = rewriter.create<VectorOp>(loc, llvmType, vectorOperand);
389fa596c69SMahesh Ravishankar   if (accumulator) {
390fa596c69SMahesh Ravishankar     Value cmp =
391fa596c69SMahesh Ravishankar         rewriter.create<LLVM::ICmpOp>(loc, predicate, accumulator, result);
392fa596c69SMahesh Ravishankar     result = rewriter.create<LLVM::SelectOp>(loc, cmp, accumulator, result);
393fa596c69SMahesh Ravishankar   }
394fa596c69SMahesh Ravishankar   return result;
395fa596c69SMahesh Ravishankar }
396fa596c69SMahesh Ravishankar 
3978fe076ffSThomas Raoux /// Create lowering of minf/maxf op. We cannot use llvm.maximum/llvm.minimum
3988fe076ffSThomas Raoux /// with vector types.
createMinMaxF(OpBuilder & builder,Location loc,Value lhs,Value rhs,bool isMin)3998fe076ffSThomas Raoux static Value createMinMaxF(OpBuilder &builder, Location loc, Value lhs,
4008fe076ffSThomas Raoux                            Value rhs, bool isMin) {
4018fe076ffSThomas Raoux   auto floatType = getElementTypeOrSelf(lhs.getType()).cast<FloatType>();
4028fe076ffSThomas Raoux   Type i1Type = builder.getI1Type();
4038fe076ffSThomas Raoux   if (auto vecType = lhs.getType().dyn_cast<VectorType>())
4048fe076ffSThomas Raoux     i1Type = VectorType::get(vecType.getShape(), i1Type);
4058fe076ffSThomas Raoux   Value cmp = builder.create<LLVM::FCmpOp>(
4068fe076ffSThomas Raoux       loc, i1Type, isMin ? LLVM::FCmpPredicate::olt : LLVM::FCmpPredicate::ogt,
4078fe076ffSThomas Raoux       lhs, rhs);
4088fe076ffSThomas Raoux   Value sel = builder.create<LLVM::SelectOp>(loc, cmp, lhs, rhs);
4098fe076ffSThomas Raoux   Value isNan = builder.create<LLVM::FCmpOp>(
4108fe076ffSThomas Raoux       loc, i1Type, LLVM::FCmpPredicate::uno, lhs, rhs);
4118fe076ffSThomas Raoux   Value nan = builder.create<LLVM::ConstantOp>(
4128fe076ffSThomas Raoux       loc, lhs.getType(),
4138fe076ffSThomas Raoux       builder.getFloatAttr(floatType,
4148fe076ffSThomas Raoux                            APFloat::getQNaN(floatType.getFloatSemantics())));
4158fe076ffSThomas Raoux   return builder.create<LLVM::SelectOp>(loc, isNan, nan, sel);
4168fe076ffSThomas Raoux }
4178fe076ffSThomas Raoux 
41819dbb230Saartbik /// Conversion pattern for all vector reductions.
419563879b6SRahul Joshi class VectorReductionOpConversion
420563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::ReductionOp> {
421e83b7b99Saartbik public:
VectorReductionOpConversion(LLVMTypeConverter & typeConv,bool reassociateFPRed)422563879b6SRahul Joshi   explicit VectorReductionOpConversion(LLVMTypeConverter &typeConv,
423060c9dd1Saartbik                                        bool reassociateFPRed)
424563879b6SRahul Joshi       : ConvertOpToLLVMPattern<vector::ReductionOp>(typeConv),
425060c9dd1Saartbik         reassociateFPReductions(reassociateFPRed) {}
426e83b7b99Saartbik 
4273145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::ReductionOp reductionOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const428ef976337SRiver Riddle   matchAndRewrite(vector::ReductionOp reductionOp, OpAdaptor adaptor,
429e83b7b99Saartbik                   ConversionPatternRewriter &rewriter) const override {
4307c38fd60SJacques Pienaar     auto kind = reductionOp.getKind();
4317c38fd60SJacques Pienaar     Type eltType = reductionOp.getDest().getType();
432dcec2ca5SChristian Sigg     Type llvmType = typeConverter->convertType(eltType);
433fa596c69SMahesh Ravishankar     Value operand = adaptor.getVector();
434fa596c69SMahesh Ravishankar     Value acc = adaptor.getAcc();
435fa596c69SMahesh Ravishankar     Location loc = reductionOp.getLoc();
436e9628955SAart Bik     if (eltType.isIntOrIndex()) {
437e83b7b99Saartbik       // Integer reductions: add/mul/min/max/and/or/xor.
438fa596c69SMahesh Ravishankar       Value result;
439fa596c69SMahesh Ravishankar       switch (kind) {
440fa596c69SMahesh Ravishankar       case vector::CombiningKind::ADD:
441fa596c69SMahesh Ravishankar         result =
442fa596c69SMahesh Ravishankar             createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_add,
443fa596c69SMahesh Ravishankar                                                        LLVM::AddOp>(
444fa596c69SMahesh Ravishankar                 rewriter, loc, llvmType, operand, acc);
445fa596c69SMahesh Ravishankar         break;
446fa596c69SMahesh Ravishankar       case vector::CombiningKind::MUL:
447fa596c69SMahesh Ravishankar         result =
448fa596c69SMahesh Ravishankar             createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_mul,
449fa596c69SMahesh Ravishankar                                                        LLVM::MulOp>(
450fa596c69SMahesh Ravishankar                 rewriter, loc, llvmType, operand, acc);
451fa596c69SMahesh Ravishankar         break;
452fa596c69SMahesh Ravishankar       case vector::CombiningKind::MINUI:
453fa596c69SMahesh Ravishankar         result = createIntegerReductionComparisonOpLowering<
454fa596c69SMahesh Ravishankar             LLVM::vector_reduce_umin>(rewriter, loc, llvmType, operand, acc,
455fa596c69SMahesh Ravishankar                                       LLVM::ICmpPredicate::ule);
456fa596c69SMahesh Ravishankar         break;
457fa596c69SMahesh Ravishankar       case vector::CombiningKind::MINSI:
458fa596c69SMahesh Ravishankar         result = createIntegerReductionComparisonOpLowering<
459fa596c69SMahesh Ravishankar             LLVM::vector_reduce_smin>(rewriter, loc, llvmType, operand, acc,
460fa596c69SMahesh Ravishankar                                       LLVM::ICmpPredicate::sle);
461fa596c69SMahesh Ravishankar         break;
462fa596c69SMahesh Ravishankar       case vector::CombiningKind::MAXUI:
463fa596c69SMahesh Ravishankar         result = createIntegerReductionComparisonOpLowering<
464fa596c69SMahesh Ravishankar             LLVM::vector_reduce_umax>(rewriter, loc, llvmType, operand, acc,
465fa596c69SMahesh Ravishankar                                       LLVM::ICmpPredicate::uge);
466fa596c69SMahesh Ravishankar         break;
467fa596c69SMahesh Ravishankar       case vector::CombiningKind::MAXSI:
468fa596c69SMahesh Ravishankar         result = createIntegerReductionComparisonOpLowering<
469fa596c69SMahesh Ravishankar             LLVM::vector_reduce_smax>(rewriter, loc, llvmType, operand, acc,
470fa596c69SMahesh Ravishankar                                       LLVM::ICmpPredicate::sge);
471fa596c69SMahesh Ravishankar         break;
472fa596c69SMahesh Ravishankar       case vector::CombiningKind::AND:
473fa596c69SMahesh Ravishankar         result =
474fa596c69SMahesh Ravishankar             createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_and,
475fa596c69SMahesh Ravishankar                                                        LLVM::AndOp>(
476fa596c69SMahesh Ravishankar                 rewriter, loc, llvmType, operand, acc);
477fa596c69SMahesh Ravishankar         break;
478fa596c69SMahesh Ravishankar       case vector::CombiningKind::OR:
479fa596c69SMahesh Ravishankar         result =
480fa596c69SMahesh Ravishankar             createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_or,
481fa596c69SMahesh Ravishankar                                                        LLVM::OrOp>(
482fa596c69SMahesh Ravishankar                 rewriter, loc, llvmType, operand, acc);
483fa596c69SMahesh Ravishankar         break;
484fa596c69SMahesh Ravishankar       case vector::CombiningKind::XOR:
485fa596c69SMahesh Ravishankar         result =
486fa596c69SMahesh Ravishankar             createIntegerReductionArithmeticOpLowering<LLVM::vector_reduce_xor,
487fa596c69SMahesh Ravishankar                                                        LLVM::XOrOp>(
488fa596c69SMahesh Ravishankar                 rewriter, loc, llvmType, operand, acc);
489fa596c69SMahesh Ravishankar         break;
490fa596c69SMahesh Ravishankar       default:
4913145427dSRiver Riddle         return failure();
492fa596c69SMahesh Ravishankar       }
493fa596c69SMahesh Ravishankar       rewriter.replaceOp(reductionOp, result);
494fa596c69SMahesh Ravishankar 
4953145427dSRiver Riddle       return success();
496dcec2ca5SChristian Sigg     }
497e83b7b99Saartbik 
498dcec2ca5SChristian Sigg     if (!eltType.isa<FloatType>())
499dcec2ca5SChristian Sigg       return failure();
500dcec2ca5SChristian Sigg 
501e83b7b99Saartbik     // Floating-point reductions: add/mul/min/max
502fe0bf7d4SMatthias Springer     if (kind == vector::CombiningKind::ADD) {
5030d924700Saartbik       // Optional accumulator (or zero).
504ef976337SRiver Riddle       Value acc = adaptor.getOperands().size() > 1
505ef976337SRiver Riddle                       ? adaptor.getOperands()[1]
5060d924700Saartbik                       : rewriter.create<LLVM::ConstantOp>(
507563879b6SRahul Joshi                             reductionOp->getLoc(), llvmType,
5080d924700Saartbik                             rewriter.getZeroAttr(eltType));
509322d0afdSAmara Emerson       rewriter.replaceOpWithNewOp<LLVM::vector_reduce_fadd>(
510ef976337SRiver Riddle           reductionOp, llvmType, acc, operand,
511ceb1b327Saartbik           rewriter.getBoolAttr(reassociateFPReductions));
512fe0bf7d4SMatthias Springer     } else if (kind == vector::CombiningKind::MUL) {
5130d924700Saartbik       // Optional accumulator (or one).
514ef976337SRiver Riddle       Value acc = adaptor.getOperands().size() > 1
515ef976337SRiver Riddle                       ? adaptor.getOperands()[1]
5160d924700Saartbik                       : rewriter.create<LLVM::ConstantOp>(
517563879b6SRahul Joshi                             reductionOp->getLoc(), llvmType,
5180d924700Saartbik                             rewriter.getFloatAttr(eltType, 1.0));
519322d0afdSAmara Emerson       rewriter.replaceOpWithNewOp<LLVM::vector_reduce_fmul>(
520ef976337SRiver Riddle           reductionOp, llvmType, acc, operand,
521ceb1b327Saartbik           rewriter.getBoolAttr(reassociateFPReductions));
5228fe076ffSThomas Raoux     } else if (kind == vector::CombiningKind::MINF) {
523eaf2588aSDiego Caballero       // FIXME: MLIR's 'minf' and LLVM's 'vector_reduce_fmin' do not handle
524eaf2588aSDiego Caballero       // NaNs/-0.0/+0.0 in the same way.
5258fe076ffSThomas Raoux       Value result =
5268fe076ffSThomas Raoux           rewriter.create<LLVM::vector_reduce_fmin>(loc, llvmType, operand);
5278fe076ffSThomas Raoux       if (acc)
5288fe076ffSThomas Raoux         result = createMinMaxF(rewriter, loc, result, acc, /*isMin=*/true);
5298fe076ffSThomas Raoux       rewriter.replaceOp(reductionOp, result);
5308fe076ffSThomas Raoux     } else if (kind == vector::CombiningKind::MAXF) {
531eaf2588aSDiego Caballero       // FIXME: MLIR's 'maxf' and LLVM's 'vector_reduce_fmax' do not handle
532eaf2588aSDiego Caballero       // NaNs/-0.0/+0.0 in the same way.
5338fe076ffSThomas Raoux       Value result =
5348fe076ffSThomas Raoux           rewriter.create<LLVM::vector_reduce_fmax>(loc, llvmType, operand);
5358fe076ffSThomas Raoux       if (acc)
5368fe076ffSThomas Raoux         result = createMinMaxF(rewriter, loc, result, acc, /*isMin=*/false);
5378fe076ffSThomas Raoux       rewriter.replaceOp(reductionOp, result);
5388fe076ffSThomas Raoux     } else
5393145427dSRiver Riddle       return failure();
5408fe076ffSThomas Raoux 
5413145427dSRiver Riddle     return success();
542e83b7b99Saartbik   }
543ceb1b327Saartbik 
544ceb1b327Saartbik private:
545ceb1b327Saartbik   const bool reassociateFPReductions;
546e83b7b99Saartbik };
547e83b7b99Saartbik 
548563879b6SRahul Joshi class VectorShuffleOpConversion
549563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::ShuffleOp> {
5501c81adf3SAart Bik public:
551563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::ShuffleOp>::ConvertOpToLLVMPattern;
5521c81adf3SAart Bik 
5533145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::ShuffleOp shuffleOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const554ef976337SRiver Riddle   matchAndRewrite(vector::ShuffleOp shuffleOp, OpAdaptor adaptor,
5551c81adf3SAart Bik                   ConversionPatternRewriter &rewriter) const override {
556563879b6SRahul Joshi     auto loc = shuffleOp->getLoc();
5571c81adf3SAart Bik     auto v1Type = shuffleOp.getV1VectorType();
5581c81adf3SAart Bik     auto v2Type = shuffleOp.getV2VectorType();
5591c81adf3SAart Bik     auto vectorType = shuffleOp.getVectorType();
560dcec2ca5SChristian Sigg     Type llvmType = typeConverter->convertType(vectorType);
5617c38fd60SJacques Pienaar     auto maskArrayAttr = shuffleOp.getMask();
5621c81adf3SAart Bik 
5631c81adf3SAart Bik     // Bail if result type cannot be lowered.
5641c81adf3SAart Bik     if (!llvmType)
5653145427dSRiver Riddle       return failure();
5661c81adf3SAart Bik 
5671c81adf3SAart Bik     // Get rank and dimension sizes.
5681c81adf3SAart Bik     int64_t rank = vectorType.getRank();
5691c81adf3SAart Bik     assert(v1Type.getRank() == rank);
5701c81adf3SAart Bik     assert(v2Type.getRank() == rank);
5711c81adf3SAart Bik     int64_t v1Dim = v1Type.getDimSize(0);
5721c81adf3SAart Bik 
5731c81adf3SAart Bik     // For rank 1, where both operands have *exactly* the same vector type,
5741c81adf3SAart Bik     // there is direct shuffle support in LLVM. Use it!
5751c81adf3SAart Bik     if (rank == 1 && v1Type == v2Type) {
576563879b6SRahul Joshi       Value llvmShuffleOp = rewriter.create<LLVM::ShuffleVectorOp>(
5777c38fd60SJacques Pienaar           loc, adaptor.getV1(), adaptor.getV2(), maskArrayAttr);
578563879b6SRahul Joshi       rewriter.replaceOp(shuffleOp, llvmShuffleOp);
5793145427dSRiver Riddle       return success();
580b36aaeafSAart Bik     }
581b36aaeafSAart Bik 
5821c81adf3SAart Bik     // For all other cases, insert the individual values individually.
5835a8a159bSMehdi Amini     Type eltType;
5845a8a159bSMehdi Amini     if (auto arrayType = llvmType.dyn_cast<LLVM::LLVMArrayType>())
5855a8a159bSMehdi Amini       eltType = arrayType.getElementType();
5865a8a159bSMehdi Amini     else
5875a8a159bSMehdi Amini       eltType = llvmType.cast<VectorType>().getElementType();
588e62a6956SRiver Riddle     Value insert = rewriter.create<LLVM::UndefOp>(loc, llvmType);
5891c81adf3SAart Bik     int64_t insPos = 0;
590e4853be2SMehdi Amini     for (const auto &en : llvm::enumerate(maskArrayAttr)) {
5911c81adf3SAart Bik       int64_t extPos = en.value().cast<IntegerAttr>().getInt();
5927c38fd60SJacques Pienaar       Value value = adaptor.getV1();
5931c81adf3SAart Bik       if (extPos >= v1Dim) {
5941c81adf3SAart Bik         extPos -= v1Dim;
5957c38fd60SJacques Pienaar         value = adaptor.getV2();
596b36aaeafSAart Bik       }
597dcec2ca5SChristian Sigg       Value extract = extractOne(rewriter, *getTypeConverter(), loc, value,
5985a8a159bSMehdi Amini                                  eltType, rank, extPos);
599dcec2ca5SChristian Sigg       insert = insertOne(rewriter, *getTypeConverter(), loc, insert, extract,
6000f04384dSAlex Zinenko                          llvmType, rank, insPos++);
6011c81adf3SAart Bik     }
602563879b6SRahul Joshi     rewriter.replaceOp(shuffleOp, insert);
6033145427dSRiver Riddle     return success();
604b36aaeafSAart Bik   }
605b36aaeafSAart Bik };
606b36aaeafSAart Bik 
607563879b6SRahul Joshi class VectorExtractElementOpConversion
608563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::ExtractElementOp> {
609cd5dab8aSAart Bik public:
610563879b6SRahul Joshi   using ConvertOpToLLVMPattern<
611563879b6SRahul Joshi       vector::ExtractElementOp>::ConvertOpToLLVMPattern;
612cd5dab8aSAart Bik 
6133145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::ExtractElementOp extractEltOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const614ef976337SRiver Riddle   matchAndRewrite(vector::ExtractElementOp extractEltOp, OpAdaptor adaptor,
615cd5dab8aSAart Bik                   ConversionPatternRewriter &rewriter) const override {
616cd5dab8aSAart Bik     auto vectorType = extractEltOp.getVectorType();
617dcec2ca5SChristian Sigg     auto llvmType = typeConverter->convertType(vectorType.getElementType());
618cd5dab8aSAart Bik 
619cd5dab8aSAart Bik     // Bail if result type cannot be lowered.
620cd5dab8aSAart Bik     if (!llvmType)
6213145427dSRiver Riddle       return failure();
622cd5dab8aSAart Bik 
623e7026abaSNicolas Vasilache     if (vectorType.getRank() == 0) {
624e7026abaSNicolas Vasilache       Location loc = extractEltOp.getLoc();
625e7026abaSNicolas Vasilache       auto idxType = rewriter.getIndexType();
626e7026abaSNicolas Vasilache       auto zero = rewriter.create<LLVM::ConstantOp>(
627e7026abaSNicolas Vasilache           loc, typeConverter->convertType(idxType),
628e7026abaSNicolas Vasilache           rewriter.getIntegerAttr(idxType, 0));
629e7026abaSNicolas Vasilache       rewriter.replaceOpWithNewOp<LLVM::ExtractElementOp>(
6307c38fd60SJacques Pienaar           extractEltOp, llvmType, adaptor.getVector(), zero);
631e7026abaSNicolas Vasilache       return success();
632e7026abaSNicolas Vasilache     }
633e7026abaSNicolas Vasilache 
634cd5dab8aSAart Bik     rewriter.replaceOpWithNewOp<LLVM::ExtractElementOp>(
6357c38fd60SJacques Pienaar         extractEltOp, llvmType, adaptor.getVector(), adaptor.getPosition());
6363145427dSRiver Riddle     return success();
637cd5dab8aSAart Bik   }
638cd5dab8aSAart Bik };
639cd5dab8aSAart Bik 
640563879b6SRahul Joshi class VectorExtractOpConversion
641563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::ExtractOp> {
6425c0c51a9SNicolas Vasilache public:
643563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::ExtractOp>::ConvertOpToLLVMPattern;
6445c0c51a9SNicolas Vasilache 
6453145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::ExtractOp extractOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const646ef976337SRiver Riddle   matchAndRewrite(vector::ExtractOp extractOp, OpAdaptor adaptor,
6475c0c51a9SNicolas Vasilache                   ConversionPatternRewriter &rewriter) const override {
648563879b6SRahul Joshi     auto loc = extractOp->getLoc();
6499826fe5cSAart Bik     auto vectorType = extractOp.getVectorType();
6502bdf33ccSRiver Riddle     auto resultType = extractOp.getResult().getType();
651dcec2ca5SChristian Sigg     auto llvmResultType = typeConverter->convertType(resultType);
6527c38fd60SJacques Pienaar     auto positionArrayAttr = extractOp.getPosition();
6539826fe5cSAart Bik 
6549826fe5cSAart Bik     // Bail if result type cannot be lowered.
6559826fe5cSAart Bik     if (!llvmResultType)
6563145427dSRiver Riddle       return failure();
6579826fe5cSAart Bik 
658864adf39SMatthias Springer     // Extract entire vector. Should be handled by folder, but just to be safe.
659864adf39SMatthias Springer     if (positionArrayAttr.empty()) {
6607c38fd60SJacques Pienaar       rewriter.replaceOp(extractOp, adaptor.getVector());
661864adf39SMatthias Springer       return success();
662864adf39SMatthias Springer     }
663864adf39SMatthias Springer 
6645c0c51a9SNicolas Vasilache     // One-shot extraction of vector from array (only requires extractvalue).
6655c0c51a9SNicolas Vasilache     if (resultType.isa<VectorType>()) {
666e62a6956SRiver Riddle       Value extracted = rewriter.create<LLVM::ExtractValueOp>(
6677c38fd60SJacques Pienaar           loc, llvmResultType, adaptor.getVector(), positionArrayAttr);
668563879b6SRahul Joshi       rewriter.replaceOp(extractOp, extracted);
6693145427dSRiver Riddle       return success();
6705c0c51a9SNicolas Vasilache     }
6715c0c51a9SNicolas Vasilache 
6729826fe5cSAart Bik     // Potential extraction of 1-D vector from array.
673563879b6SRahul Joshi     auto *context = extractOp->getContext();
6747c38fd60SJacques Pienaar     Value extracted = adaptor.getVector();
6755c0c51a9SNicolas Vasilache     auto positionAttrs = positionArrayAttr.getValue();
6765c0c51a9SNicolas Vasilache     if (positionAttrs.size() > 1) {
6779826fe5cSAart Bik       auto oneDVectorType = reducedVectorTypeBack(vectorType);
6785c0c51a9SNicolas Vasilache       auto nMinusOnePositionAttrs =
679c2c83e97STres Popp           ArrayAttr::get(context, positionAttrs.drop_back());
6805c0c51a9SNicolas Vasilache       extracted = rewriter.create<LLVM::ExtractValueOp>(
681dcec2ca5SChristian Sigg           loc, typeConverter->convertType(oneDVectorType), extracted,
6825c0c51a9SNicolas Vasilache           nMinusOnePositionAttrs);
6835c0c51a9SNicolas Vasilache     }
6845c0c51a9SNicolas Vasilache 
6855c0c51a9SNicolas Vasilache     // Remaining extraction of element from 1-D LLVM vector
6865c0c51a9SNicolas Vasilache     auto position = positionAttrs.back().cast<IntegerAttr>();
6872230bf99SAlex Zinenko     auto i64Type = IntegerType::get(rewriter.getContext(), 64);
6881d47564aSAart Bik     auto constant = rewriter.create<LLVM::ConstantOp>(loc, i64Type, position);
6895c0c51a9SNicolas Vasilache     extracted =
6905c0c51a9SNicolas Vasilache         rewriter.create<LLVM::ExtractElementOp>(loc, extracted, constant);
691563879b6SRahul Joshi     rewriter.replaceOp(extractOp, extracted);
6925c0c51a9SNicolas Vasilache 
6933145427dSRiver Riddle     return success();
6945c0c51a9SNicolas Vasilache   }
6955c0c51a9SNicolas Vasilache };
6965c0c51a9SNicolas Vasilache 
697681f929fSNicolas Vasilache /// Conversion pattern that turns a vector.fma on a 1-D vector
698681f929fSNicolas Vasilache /// into an llvm.intr.fmuladd. This is a trivial 1-1 conversion.
699681f929fSNicolas Vasilache /// This does not match vectors of n >= 2 rank.
700681f929fSNicolas Vasilache ///
701681f929fSNicolas Vasilache /// Example:
702681f929fSNicolas Vasilache /// ```
703681f929fSNicolas Vasilache ///  vector.fma %a, %a, %a : vector<8xf32>
704681f929fSNicolas Vasilache /// ```
705681f929fSNicolas Vasilache /// is converted to:
706681f929fSNicolas Vasilache /// ```
7073bffe602SBenjamin Kramer ///  llvm.intr.fmuladd %va, %va, %va:
708dd5165a9SAlex Zinenko ///    (!llvm."<8 x f32>">, !llvm<"<8 x f32>">, !llvm<"<8 x f32>">)
709dd5165a9SAlex Zinenko ///    -> !llvm."<8 x f32>">
710681f929fSNicolas Vasilache /// ```
711563879b6SRahul Joshi class VectorFMAOp1DConversion : public ConvertOpToLLVMPattern<vector::FMAOp> {
712681f929fSNicolas Vasilache public:
713563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::FMAOp>::ConvertOpToLLVMPattern;
714681f929fSNicolas Vasilache 
7153145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::FMAOp fmaOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const716ef976337SRiver Riddle   matchAndRewrite(vector::FMAOp fmaOp, OpAdaptor adaptor,
717681f929fSNicolas Vasilache                   ConversionPatternRewriter &rewriter) const override {
718681f929fSNicolas Vasilache     VectorType vType = fmaOp.getVectorType();
719681f929fSNicolas Vasilache     if (vType.getRank() != 1)
7203145427dSRiver Riddle       return failure();
7217c38fd60SJacques Pienaar     rewriter.replaceOpWithNewOp<LLVM::FMulAddOp>(
7227c38fd60SJacques Pienaar         fmaOp, adaptor.getLhs(), adaptor.getRhs(), adaptor.getAcc());
7233145427dSRiver Riddle     return success();
724681f929fSNicolas Vasilache   }
725681f929fSNicolas Vasilache };
726681f929fSNicolas Vasilache 
727563879b6SRahul Joshi class VectorInsertElementOpConversion
728563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::InsertElementOp> {
729cd5dab8aSAart Bik public:
730563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::InsertElementOp>::ConvertOpToLLVMPattern;
731cd5dab8aSAart Bik 
7323145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::InsertElementOp insertEltOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const733ef976337SRiver Riddle   matchAndRewrite(vector::InsertElementOp insertEltOp, OpAdaptor adaptor,
734cd5dab8aSAart Bik                   ConversionPatternRewriter &rewriter) const override {
735cd5dab8aSAart Bik     auto vectorType = insertEltOp.getDestVectorType();
736dcec2ca5SChristian Sigg     auto llvmType = typeConverter->convertType(vectorType);
737cd5dab8aSAart Bik 
738cd5dab8aSAart Bik     // Bail if result type cannot be lowered.
739cd5dab8aSAart Bik     if (!llvmType)
7403145427dSRiver Riddle       return failure();
741cd5dab8aSAart Bik 
7423ff4e5f2SNicolas Vasilache     if (vectorType.getRank() == 0) {
7433ff4e5f2SNicolas Vasilache       Location loc = insertEltOp.getLoc();
7443ff4e5f2SNicolas Vasilache       auto idxType = rewriter.getIndexType();
7453ff4e5f2SNicolas Vasilache       auto zero = rewriter.create<LLVM::ConstantOp>(
7463ff4e5f2SNicolas Vasilache           loc, typeConverter->convertType(idxType),
7473ff4e5f2SNicolas Vasilache           rewriter.getIntegerAttr(idxType, 0));
7483ff4e5f2SNicolas Vasilache       rewriter.replaceOpWithNewOp<LLVM::InsertElementOp>(
7497c38fd60SJacques Pienaar           insertEltOp, llvmType, adaptor.getDest(), adaptor.getSource(), zero);
7503ff4e5f2SNicolas Vasilache       return success();
7513ff4e5f2SNicolas Vasilache     }
7523ff4e5f2SNicolas Vasilache 
753cd5dab8aSAart Bik     rewriter.replaceOpWithNewOp<LLVM::InsertElementOp>(
7547c38fd60SJacques Pienaar         insertEltOp, llvmType, adaptor.getDest(), adaptor.getSource(),
7557c38fd60SJacques Pienaar         adaptor.getPosition());
7563145427dSRiver Riddle     return success();
757cd5dab8aSAart Bik   }
758cd5dab8aSAart Bik };
759cd5dab8aSAart Bik 
760563879b6SRahul Joshi class VectorInsertOpConversion
761563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::InsertOp> {
7629826fe5cSAart Bik public:
763563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::InsertOp>::ConvertOpToLLVMPattern;
7649826fe5cSAart Bik 
7653145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::InsertOp insertOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const766ef976337SRiver Riddle   matchAndRewrite(vector::InsertOp insertOp, OpAdaptor adaptor,
7679826fe5cSAart Bik                   ConversionPatternRewriter &rewriter) const override {
768563879b6SRahul Joshi     auto loc = insertOp->getLoc();
7699826fe5cSAart Bik     auto sourceType = insertOp.getSourceType();
7709826fe5cSAart Bik     auto destVectorType = insertOp.getDestVectorType();
771dcec2ca5SChristian Sigg     auto llvmResultType = typeConverter->convertType(destVectorType);
7727c38fd60SJacques Pienaar     auto positionArrayAttr = insertOp.getPosition();
7739826fe5cSAart Bik 
7749826fe5cSAart Bik     // Bail if result type cannot be lowered.
7759826fe5cSAart Bik     if (!llvmResultType)
7763145427dSRiver Riddle       return failure();
7779826fe5cSAart Bik 
778864adf39SMatthias Springer     // Overwrite entire vector with value. Should be handled by folder, but
779864adf39SMatthias Springer     // just to be safe.
780864adf39SMatthias Springer     if (positionArrayAttr.empty()) {
7817c38fd60SJacques Pienaar       rewriter.replaceOp(insertOp, adaptor.getSource());
782864adf39SMatthias Springer       return success();
783864adf39SMatthias Springer     }
784864adf39SMatthias Springer 
7859826fe5cSAart Bik     // One-shot insertion of a vector into an array (only requires insertvalue).
7869826fe5cSAart Bik     if (sourceType.isa<VectorType>()) {
787e62a6956SRiver Riddle       Value inserted = rewriter.create<LLVM::InsertValueOp>(
7887c38fd60SJacques Pienaar           loc, llvmResultType, adaptor.getDest(), adaptor.getSource(),
7899826fe5cSAart Bik           positionArrayAttr);
790563879b6SRahul Joshi       rewriter.replaceOp(insertOp, inserted);
7913145427dSRiver Riddle       return success();
7929826fe5cSAart Bik     }
7939826fe5cSAart Bik 
7949826fe5cSAart Bik     // Potential extraction of 1-D vector from array.
795563879b6SRahul Joshi     auto *context = insertOp->getContext();
7967c38fd60SJacques Pienaar     Value extracted = adaptor.getDest();
7979826fe5cSAart Bik     auto positionAttrs = positionArrayAttr.getValue();
7989826fe5cSAart Bik     auto position = positionAttrs.back().cast<IntegerAttr>();
7999826fe5cSAart Bik     auto oneDVectorType = destVectorType;
8009826fe5cSAart Bik     if (positionAttrs.size() > 1) {
8019826fe5cSAart Bik       oneDVectorType = reducedVectorTypeBack(destVectorType);
8029826fe5cSAart Bik       auto nMinusOnePositionAttrs =
803c2c83e97STres Popp           ArrayAttr::get(context, positionAttrs.drop_back());
8049826fe5cSAart Bik       extracted = rewriter.create<LLVM::ExtractValueOp>(
805dcec2ca5SChristian Sigg           loc, typeConverter->convertType(oneDVectorType), extracted,
8069826fe5cSAart Bik           nMinusOnePositionAttrs);
8079826fe5cSAart Bik     }
8089826fe5cSAart Bik 
8099826fe5cSAart Bik     // Insertion of an element into a 1-D LLVM vector.
8102230bf99SAlex Zinenko     auto i64Type = IntegerType::get(rewriter.getContext(), 64);
8111d47564aSAart Bik     auto constant = rewriter.create<LLVM::ConstantOp>(loc, i64Type, position);
812e62a6956SRiver Riddle     Value inserted = rewriter.create<LLVM::InsertElementOp>(
813dcec2ca5SChristian Sigg         loc, typeConverter->convertType(oneDVectorType), extracted,
8147c38fd60SJacques Pienaar         adaptor.getSource(), constant);
8159826fe5cSAart Bik 
8169826fe5cSAart Bik     // Potential insertion of resulting 1-D vector into array.
8179826fe5cSAart Bik     if (positionAttrs.size() > 1) {
8189826fe5cSAart Bik       auto nMinusOnePositionAttrs =
819c2c83e97STres Popp           ArrayAttr::get(context, positionAttrs.drop_back());
8207c38fd60SJacques Pienaar       inserted = rewriter.create<LLVM::InsertValueOp>(
8217c38fd60SJacques Pienaar           loc, llvmResultType, adaptor.getDest(), inserted,
8229826fe5cSAart Bik           nMinusOnePositionAttrs);
8239826fe5cSAart Bik     }
8249826fe5cSAart Bik 
825563879b6SRahul Joshi     rewriter.replaceOp(insertOp, inserted);
8263145427dSRiver Riddle     return success();
8279826fe5cSAart Bik   }
8289826fe5cSAart Bik };
8299826fe5cSAart Bik 
830681f929fSNicolas Vasilache /// Rank reducing rewrite for n-D FMA into (n-1)-D FMA where n > 1.
831681f929fSNicolas Vasilache ///
832681f929fSNicolas Vasilache /// Example:
833681f929fSNicolas Vasilache /// ```
834681f929fSNicolas Vasilache ///   %d = vector.fma %a, %b, %c : vector<2x4xf32>
835681f929fSNicolas Vasilache /// ```
836681f929fSNicolas Vasilache /// is rewritten into:
837681f929fSNicolas Vasilache /// ```
838681f929fSNicolas Vasilache ///  %r = splat %f0: vector<2x4xf32>
839681f929fSNicolas Vasilache ///  %va = vector.extractvalue %a[0] : vector<2x4xf32>
840681f929fSNicolas Vasilache ///  %vb = vector.extractvalue %b[0] : vector<2x4xf32>
841681f929fSNicolas Vasilache ///  %vc = vector.extractvalue %c[0] : vector<2x4xf32>
842681f929fSNicolas Vasilache ///  %vd = vector.fma %va, %vb, %vc : vector<4xf32>
843681f929fSNicolas Vasilache ///  %r2 = vector.insertvalue %vd, %r[0] : vector<4xf32> into vector<2x4xf32>
844681f929fSNicolas Vasilache ///  %va2 = vector.extractvalue %a2[1] : vector<2x4xf32>
845681f929fSNicolas Vasilache ///  %vb2 = vector.extractvalue %b2[1] : vector<2x4xf32>
846681f929fSNicolas Vasilache ///  %vc2 = vector.extractvalue %c2[1] : vector<2x4xf32>
847681f929fSNicolas Vasilache ///  %vd2 = vector.fma %va2, %vb2, %vc2 : vector<4xf32>
848681f929fSNicolas Vasilache ///  %r3 = vector.insertvalue %vd2, %r2[1] : vector<4xf32> into vector<2x4xf32>
849681f929fSNicolas Vasilache ///  // %r3 holds the final value.
850681f929fSNicolas Vasilache /// ```
851681f929fSNicolas Vasilache class VectorFMAOpNDRewritePattern : public OpRewritePattern<FMAOp> {
852681f929fSNicolas Vasilache public:
853681f929fSNicolas Vasilache   using OpRewritePattern<FMAOp>::OpRewritePattern;
854681f929fSNicolas Vasilache 
initialize()855ee80ffbfSNicolas Vasilache   void initialize() {
856ee80ffbfSNicolas Vasilache     // This pattern recursively unpacks one dimension at a time. The recursion
857ee80ffbfSNicolas Vasilache     // bounded as the rank is strictly decreasing.
858ee80ffbfSNicolas Vasilache     setHasBoundedRewriteRecursion();
859ee80ffbfSNicolas Vasilache   }
860ee80ffbfSNicolas Vasilache 
matchAndRewrite(FMAOp op,PatternRewriter & rewriter) const8613145427dSRiver Riddle   LogicalResult matchAndRewrite(FMAOp op,
862681f929fSNicolas Vasilache                                 PatternRewriter &rewriter) const override {
863681f929fSNicolas Vasilache     auto vType = op.getVectorType();
864681f929fSNicolas Vasilache     if (vType.getRank() < 2)
8653145427dSRiver Riddle       return failure();
866681f929fSNicolas Vasilache 
867681f929fSNicolas Vasilache     auto loc = op.getLoc();
868681f929fSNicolas Vasilache     auto elemType = vType.getElementType();
869a54f4eaeSMogball     Value zero = rewriter.create<arith::ConstantOp>(
870a54f4eaeSMogball         loc, elemType, rewriter.getZeroAttr(elemType));
8716a8ba318SRiver Riddle     Value desc = rewriter.create<vector::SplatOp>(loc, vType, zero);
872681f929fSNicolas Vasilache     for (int64_t i = 0, e = vType.getShape().front(); i != e; ++i) {
8737c38fd60SJacques Pienaar       Value extrLHS = rewriter.create<ExtractOp>(loc, op.getLhs(), i);
8747c38fd60SJacques Pienaar       Value extrRHS = rewriter.create<ExtractOp>(loc, op.getRhs(), i);
8757c38fd60SJacques Pienaar       Value extrACC = rewriter.create<ExtractOp>(loc, op.getAcc(), i);
876681f929fSNicolas Vasilache       Value fma = rewriter.create<FMAOp>(loc, extrLHS, extrRHS, extrACC);
877681f929fSNicolas Vasilache       desc = rewriter.create<InsertOp>(loc, fma, desc, i);
878681f929fSNicolas Vasilache     }
879681f929fSNicolas Vasilache     rewriter.replaceOp(op, desc);
8803145427dSRiver Riddle     return success();
881681f929fSNicolas Vasilache   }
882681f929fSNicolas Vasilache };
883681f929fSNicolas Vasilache 
88430e6033bSNicolas Vasilache /// Returns the strides if the memory underlying `memRefType` has a contiguous
88530e6033bSNicolas Vasilache /// static layout.
88630e6033bSNicolas Vasilache static llvm::Optional<SmallVector<int64_t, 4>>
computeContiguousStrides(MemRefType memRefType)88730e6033bSNicolas Vasilache computeContiguousStrides(MemRefType memRefType) {
8882bf491c7SBenjamin Kramer   int64_t offset;
88930e6033bSNicolas Vasilache   SmallVector<int64_t, 4> strides;
89030e6033bSNicolas Vasilache   if (failed(getStridesAndOffset(memRefType, strides, offset)))
89130e6033bSNicolas Vasilache     return None;
89230e6033bSNicolas Vasilache   if (!strides.empty() && strides.back() != 1)
89330e6033bSNicolas Vasilache     return None;
89430e6033bSNicolas Vasilache   // If no layout or identity layout, this is contiguous by definition.
895e41ebbecSVladislav Vinogradov   if (memRefType.getLayout().isIdentity())
89630e6033bSNicolas Vasilache     return strides;
89730e6033bSNicolas Vasilache 
89830e6033bSNicolas Vasilache   // Otherwise, we must determine contiguity form shapes. This can only ever
89930e6033bSNicolas Vasilache   // work in static cases because MemRefType is underspecified to represent
90030e6033bSNicolas Vasilache   // contiguous dynamic shapes in other ways than with just empty/identity
90130e6033bSNicolas Vasilache   // layout.
9022bf491c7SBenjamin Kramer   auto sizes = memRefType.getShape();
9035017b0f8SMatthias Springer   for (int index = 0, e = strides.size() - 1; index < e; ++index) {
90430e6033bSNicolas Vasilache     if (ShapedType::isDynamic(sizes[index + 1]) ||
90530e6033bSNicolas Vasilache         ShapedType::isDynamicStrideOrOffset(strides[index]) ||
90630e6033bSNicolas Vasilache         ShapedType::isDynamicStrideOrOffset(strides[index + 1]))
90730e6033bSNicolas Vasilache       return None;
90830e6033bSNicolas Vasilache     if (strides[index] != strides[index + 1] * sizes[index + 1])
90930e6033bSNicolas Vasilache       return None;
9102bf491c7SBenjamin Kramer   }
91130e6033bSNicolas Vasilache   return strides;
9122bf491c7SBenjamin Kramer }
9132bf491c7SBenjamin Kramer 
914563879b6SRahul Joshi class VectorTypeCastOpConversion
915563879b6SRahul Joshi     : public ConvertOpToLLVMPattern<vector::TypeCastOp> {
9165c0c51a9SNicolas Vasilache public:
917563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::TypeCastOp>::ConvertOpToLLVMPattern;
9185c0c51a9SNicolas Vasilache 
9193145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::TypeCastOp castOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const920ef976337SRiver Riddle   matchAndRewrite(vector::TypeCastOp castOp, OpAdaptor adaptor,
9215c0c51a9SNicolas Vasilache                   ConversionPatternRewriter &rewriter) const override {
922563879b6SRahul Joshi     auto loc = castOp->getLoc();
9235c0c51a9SNicolas Vasilache     MemRefType sourceMemRefType =
9242bdf33ccSRiver Riddle         castOp.getOperand().getType().cast<MemRefType>();
9259eb3e564SChris Lattner     MemRefType targetMemRefType = castOp.getType();
9265c0c51a9SNicolas Vasilache 
9275c0c51a9SNicolas Vasilache     // Only static shape casts supported atm.
9285c0c51a9SNicolas Vasilache     if (!sourceMemRefType.hasStaticShape() ||
9295c0c51a9SNicolas Vasilache         !targetMemRefType.hasStaticShape())
9303145427dSRiver Riddle       return failure();
9315c0c51a9SNicolas Vasilache 
9325c0c51a9SNicolas Vasilache     auto llvmSourceDescriptorTy =
933ef976337SRiver Riddle         adaptor.getOperands()[0].getType().dyn_cast<LLVM::LLVMStructType>();
9348de43b92SAlex Zinenko     if (!llvmSourceDescriptorTy)
9353145427dSRiver Riddle       return failure();
936ef976337SRiver Riddle     MemRefDescriptor sourceMemRef(adaptor.getOperands()[0]);
9375c0c51a9SNicolas Vasilache 
938dcec2ca5SChristian Sigg     auto llvmTargetDescriptorTy = typeConverter->convertType(targetMemRefType)
9398de43b92SAlex Zinenko                                       .dyn_cast_or_null<LLVM::LLVMStructType>();
9408de43b92SAlex Zinenko     if (!llvmTargetDescriptorTy)
9413145427dSRiver Riddle       return failure();
9425c0c51a9SNicolas Vasilache 
94330e6033bSNicolas Vasilache     // Only contiguous source buffers supported atm.
94430e6033bSNicolas Vasilache     auto sourceStrides = computeContiguousStrides(sourceMemRefType);
94530e6033bSNicolas Vasilache     if (!sourceStrides)
94630e6033bSNicolas Vasilache       return failure();
94730e6033bSNicolas Vasilache     auto targetStrides = computeContiguousStrides(targetMemRefType);
94830e6033bSNicolas Vasilache     if (!targetStrides)
94930e6033bSNicolas Vasilache       return failure();
95030e6033bSNicolas Vasilache     // Only support static strides for now, regardless of contiguity.
951*380a1b20SKazu Hirata     if (llvm::any_of(*targetStrides, ShapedType::isDynamicStrideOrOffset))
9523145427dSRiver Riddle       return failure();
9535c0c51a9SNicolas Vasilache 
9542230bf99SAlex Zinenko     auto int64Ty = IntegerType::get(rewriter.getContext(), 64);
9555c0c51a9SNicolas Vasilache 
9565c0c51a9SNicolas Vasilache     // Create descriptor.
9575c0c51a9SNicolas Vasilache     auto desc = MemRefDescriptor::undef(rewriter, loc, llvmTargetDescriptorTy);
9583a577f54SChristian Sigg     Type llvmTargetElementTy = desc.getElementPtrType();
9595c0c51a9SNicolas Vasilache     // Set allocated ptr.
960e62a6956SRiver Riddle     Value allocated = sourceMemRef.allocatedPtr(rewriter, loc);
9615c0c51a9SNicolas Vasilache     allocated =
9625c0c51a9SNicolas Vasilache         rewriter.create<LLVM::BitcastOp>(loc, llvmTargetElementTy, allocated);
9635c0c51a9SNicolas Vasilache     desc.setAllocatedPtr(rewriter, loc, allocated);
9645c0c51a9SNicolas Vasilache     // Set aligned ptr.
965e62a6956SRiver Riddle     Value ptr = sourceMemRef.alignedPtr(rewriter, loc);
9665c0c51a9SNicolas Vasilache     ptr = rewriter.create<LLVM::BitcastOp>(loc, llvmTargetElementTy, ptr);
9675c0c51a9SNicolas Vasilache     desc.setAlignedPtr(rewriter, loc, ptr);
9685c0c51a9SNicolas Vasilache     // Fill offset 0.
9695c0c51a9SNicolas Vasilache     auto attr = rewriter.getIntegerAttr(rewriter.getIndexType(), 0);
9705c0c51a9SNicolas Vasilache     auto zero = rewriter.create<LLVM::ConstantOp>(loc, int64Ty, attr);
9715c0c51a9SNicolas Vasilache     desc.setOffset(rewriter, loc, zero);
9725c0c51a9SNicolas Vasilache 
9735c0c51a9SNicolas Vasilache     // Fill size and stride descriptors in memref.
974e4853be2SMehdi Amini     for (const auto &indexedSize :
975e4853be2SMehdi Amini          llvm::enumerate(targetMemRefType.getShape())) {
9765c0c51a9SNicolas Vasilache       int64_t index = indexedSize.index();
9775c0c51a9SNicolas Vasilache       auto sizeAttr =
9785c0c51a9SNicolas Vasilache           rewriter.getIntegerAttr(rewriter.getIndexType(), indexedSize.value());
9795c0c51a9SNicolas Vasilache       auto size = rewriter.create<LLVM::ConstantOp>(loc, int64Ty, sizeAttr);
9805c0c51a9SNicolas Vasilache       desc.setSize(rewriter, loc, index, size);
98130e6033bSNicolas Vasilache       auto strideAttr = rewriter.getIntegerAttr(rewriter.getIndexType(),
98230e6033bSNicolas Vasilache                                                 (*targetStrides)[index]);
9835c0c51a9SNicolas Vasilache       auto stride = rewriter.create<LLVM::ConstantOp>(loc, int64Ty, strideAttr);
9845c0c51a9SNicolas Vasilache       desc.setStride(rewriter, loc, index, stride);
9855c0c51a9SNicolas Vasilache     }
9865c0c51a9SNicolas Vasilache 
987563879b6SRahul Joshi     rewriter.replaceOp(castOp, {desc});
9883145427dSRiver Riddle     return success();
9895c0c51a9SNicolas Vasilache   }
9905c0c51a9SNicolas Vasilache };
9915c0c51a9SNicolas Vasilache 
992a75a46dbSJavier Setoain /// Conversion pattern for a `vector.create_mask` (1-D scalable vectors only).
993a75a46dbSJavier Setoain /// Non-scalable versions of this operation are handled in Vector Transforms.
994a75a46dbSJavier Setoain class VectorCreateMaskOpRewritePattern
995a75a46dbSJavier Setoain     : public OpRewritePattern<vector::CreateMaskOp> {
996a75a46dbSJavier Setoain public:
VectorCreateMaskOpRewritePattern(MLIRContext * context,bool enableIndexOpt)997a75a46dbSJavier Setoain   explicit VectorCreateMaskOpRewritePattern(MLIRContext *context,
998a75a46dbSJavier Setoain                                             bool enableIndexOpt)
999a75a46dbSJavier Setoain       : OpRewritePattern<vector::CreateMaskOp>(context),
10007bc8ad51SJavier Setoain         force32BitVectorIndices(enableIndexOpt) {}
1001a75a46dbSJavier Setoain 
matchAndRewrite(vector::CreateMaskOp op,PatternRewriter & rewriter) const1002a75a46dbSJavier Setoain   LogicalResult matchAndRewrite(vector::CreateMaskOp op,
1003a75a46dbSJavier Setoain                                 PatternRewriter &rewriter) const override {
1004a75a46dbSJavier Setoain     auto dstType = op.getType();
1005a75a46dbSJavier Setoain     if (dstType.getRank() != 1 || !dstType.cast<VectorType>().isScalable())
1006a75a46dbSJavier Setoain       return failure();
1007a75a46dbSJavier Setoain     IntegerType idxType =
10087bc8ad51SJavier Setoain         force32BitVectorIndices ? rewriter.getI32Type() : rewriter.getI64Type();
1009a75a46dbSJavier Setoain     auto loc = op->getLoc();
1010a75a46dbSJavier Setoain     Value indices = rewriter.create<LLVM::StepVectorOp>(
1011a75a46dbSJavier Setoain         loc, LLVM::getVectorType(idxType, dstType.getShape()[0],
1012a75a46dbSJavier Setoain                                  /*isScalable=*/true));
1013a75a46dbSJavier Setoain     auto bound = getValueOrCreateCastToIndexLike(rewriter, loc, idxType,
1014a75a46dbSJavier Setoain                                                  op.getOperand(0));
1015a75a46dbSJavier Setoain     Value bounds = rewriter.create<SplatOp>(loc, indices.getType(), bound);
1016a75a46dbSJavier Setoain     Value comp = rewriter.create<arith::CmpIOp>(loc, arith::CmpIPredicate::slt,
1017a75a46dbSJavier Setoain                                                 indices, bounds);
1018a75a46dbSJavier Setoain     rewriter.replaceOp(op, comp);
1019a75a46dbSJavier Setoain     return success();
1020a75a46dbSJavier Setoain   }
1021a75a46dbSJavier Setoain 
1022a75a46dbSJavier Setoain private:
10237bc8ad51SJavier Setoain   const bool force32BitVectorIndices;
1024a75a46dbSJavier Setoain };
1025a75a46dbSJavier Setoain 
1026563879b6SRahul Joshi class VectorPrintOpConversion : public ConvertOpToLLVMPattern<vector::PrintOp> {
1027d9b500d3SAart Bik public:
1028563879b6SRahul Joshi   using ConvertOpToLLVMPattern<vector::PrintOp>::ConvertOpToLLVMPattern;
1029d9b500d3SAart Bik 
1030d9b500d3SAart Bik   // Proof-of-concept lowering implementation that relies on a small
1031d9b500d3SAart Bik   // runtime support library, which only needs to provide a few
1032d9b500d3SAart Bik   // printing methods (single value for all data types, opening/closing
1033d9b500d3SAart Bik   // bracket, comma, newline). The lowering fully unrolls a vector
1034d9b500d3SAart Bik   // in terms of these elementary printing operations. The advantage
1035d9b500d3SAart Bik   // of this approach is that the library can remain unaware of all
1036d9b500d3SAart Bik   // low-level implementation details of vectors while still supporting
1037d9b500d3SAart Bik   // output of any shaped and dimensioned vector. Due to full unrolling,
1038d9b500d3SAart Bik   // this approach is less suited for very large vectors though.
1039d9b500d3SAart Bik   //
10409db53a18SRiver Riddle   // TODO: rely solely on libc in future? something else?
1041d9b500d3SAart Bik   //
10423145427dSRiver Riddle   LogicalResult
matchAndRewrite(vector::PrintOp printOp,OpAdaptor adaptor,ConversionPatternRewriter & rewriter) const1043ef976337SRiver Riddle   matchAndRewrite(vector::PrintOp printOp, OpAdaptor adaptor,
1044d9b500d3SAart Bik                   ConversionPatternRewriter &rewriter) const override {
1045d9b500d3SAart Bik     Type printType = printOp.getPrintType();
1046d9b500d3SAart Bik 
1047dcec2ca5SChristian Sigg     if (typeConverter->convertType(printType) == nullptr)
10483145427dSRiver Riddle       return failure();
1049d9b500d3SAart Bik 
1050b8880f5fSAart Bik     // Make sure element type has runtime support.
1051b8880f5fSAart Bik     PrintConversion conversion = PrintConversion::None;
1052d9b500d3SAart Bik     VectorType vectorType = printType.dyn_cast<VectorType>();
1053d9b500d3SAart Bik     Type eltType = vectorType ? vectorType.getElementType() : printType;
1054d9b500d3SAart Bik     Operation *printer;
1055b8880f5fSAart Bik     if (eltType.isF32()) {
1056e332c22cSNicolas Vasilache       printer =
1057e332c22cSNicolas Vasilache           LLVM::lookupOrCreatePrintF32Fn(printOp->getParentOfType<ModuleOp>());
1058b8880f5fSAart Bik     } else if (eltType.isF64()) {
1059e332c22cSNicolas Vasilache       printer =
1060e332c22cSNicolas Vasilache           LLVM::lookupOrCreatePrintF64Fn(printOp->getParentOfType<ModuleOp>());
106154759cefSAart Bik     } else if (eltType.isIndex()) {
1062e332c22cSNicolas Vasilache       printer =
1063e332c22cSNicolas Vasilache           LLVM::lookupOrCreatePrintU64Fn(printOp->getParentOfType<ModuleOp>());
1064b8880f5fSAart Bik     } else if (auto intTy = eltType.dyn_cast<IntegerType>()) {
1065b8880f5fSAart Bik       // Integers need a zero or sign extension on the operand
1066b8880f5fSAart Bik       // (depending on the source type) as well as a signed or
1067b8880f5fSAart Bik       // unsigned print method. Up to 64-bit is supported.
1068b8880f5fSAart Bik       unsigned width = intTy.getWidth();
1069b8880f5fSAart Bik       if (intTy.isUnsigned()) {
107054759cefSAart Bik         if (width <= 64) {
1071b8880f5fSAart Bik           if (width < 64)
1072b8880f5fSAart Bik             conversion = PrintConversion::ZeroExt64;
1073e332c22cSNicolas Vasilache           printer = LLVM::lookupOrCreatePrintU64Fn(
1074e332c22cSNicolas Vasilache               printOp->getParentOfType<ModuleOp>());
1075b8880f5fSAart Bik         } else {
10763145427dSRiver Riddle           return failure();
1077b8880f5fSAart Bik         }
1078b8880f5fSAart Bik       } else {
1079b8880f5fSAart Bik         assert(intTy.isSignless() || intTy.isSigned());
108054759cefSAart Bik         if (width <= 64) {
1081b8880f5fSAart Bik           // Note that we *always* zero extend booleans (1-bit integers),
1082b8880f5fSAart Bik           // so that true/false is printed as 1/0 rather than -1/0.
1083b8880f5fSAart Bik           if (width == 1)
108454759cefSAart Bik             conversion = PrintConversion::ZeroExt64;
108554759cefSAart Bik           else if (width < 64)
1086b8880f5fSAart Bik             conversion = PrintConversion::SignExt64;
1087e332c22cSNicolas Vasilache           printer = LLVM::lookupOrCreatePrintI64Fn(
1088e332c22cSNicolas Vasilache               printOp->getParentOfType<ModuleOp>());
1089b8880f5fSAart Bik         } else {
1090b8880f5fSAart Bik           return failure();
1091b8880f5fSAart Bik         }
1092b8880f5fSAart Bik       }
1093b8880f5fSAart Bik     } else {
1094b8880f5fSAart Bik       return failure();
1095b8880f5fSAart Bik     }
1096d9b500d3SAart Bik 
1097d9b500d3SAart Bik     // Unroll vector into elementary print calls.
1098b8880f5fSAart Bik     int64_t rank = vectorType ? vectorType.getRank() : 0;
1099cc311a15SMichal Terepeta     Type type = vectorType ? vectorType : eltType;
11007c38fd60SJacques Pienaar     emitRanks(rewriter, printOp, adaptor.getSource(), type, printer, rank,
1101b8880f5fSAart Bik               conversion);
1102e332c22cSNicolas Vasilache     emitCall(rewriter, printOp->getLoc(),
1103e332c22cSNicolas Vasilache              LLVM::lookupOrCreatePrintNewlineFn(
1104e332c22cSNicolas Vasilache                  printOp->getParentOfType<ModuleOp>()));
1105563879b6SRahul Joshi     rewriter.eraseOp(printOp);
11063145427dSRiver Riddle     return success();
1107d9b500d3SAart Bik   }
1108d9b500d3SAart Bik 
1109d9b500d3SAart Bik private:
1110b8880f5fSAart Bik   enum class PrintConversion {
111130e6033bSNicolas Vasilache     // clang-format off
1112b8880f5fSAart Bik     None,
1113b8880f5fSAart Bik     ZeroExt64,
1114b8880f5fSAart Bik     SignExt64
111530e6033bSNicolas Vasilache     // clang-format on
1116b8880f5fSAart Bik   };
1117b8880f5fSAart Bik 
emitRanks(ConversionPatternRewriter & rewriter,Operation * op,Value value,Type type,Operation * printer,int64_t rank,PrintConversion conversion) const1118d9b500d3SAart Bik   void emitRanks(ConversionPatternRewriter &rewriter, Operation *op,
1119cc311a15SMichal Terepeta                  Value value, Type type, Operation *printer, int64_t rank,
1120cc311a15SMichal Terepeta                  PrintConversion conversion) const {
1121cc311a15SMichal Terepeta     VectorType vectorType = type.dyn_cast<VectorType>();
1122d9b500d3SAart Bik     Location loc = op->getLoc();
1123cc311a15SMichal Terepeta     if (!vectorType) {
1124cc311a15SMichal Terepeta       assert(rank == 0 && "The scalar case expects rank == 0");
1125b8880f5fSAart Bik       switch (conversion) {
1126b8880f5fSAart Bik       case PrintConversion::ZeroExt64:
1127a54f4eaeSMogball         value = rewriter.create<arith::ExtUIOp>(
11283c69bc4dSRiver Riddle             loc, IntegerType::get(rewriter.getContext(), 64), value);
1129b8880f5fSAart Bik         break;
1130b8880f5fSAart Bik       case PrintConversion::SignExt64:
1131a54f4eaeSMogball         value = rewriter.create<arith::ExtSIOp>(
11323c69bc4dSRiver Riddle             loc, IntegerType::get(rewriter.getContext(), 64), value);
1133b8880f5fSAart Bik         break;
1134b8880f5fSAart Bik       case PrintConversion::None:
1135b8880f5fSAart Bik         break;
1136c9eeeb38Saartbik       }
1137d9b500d3SAart Bik       emitCall(rewriter, loc, printer, value);
1138d9b500d3SAart Bik       return;
1139d9b500d3SAart Bik     }
1140d9b500d3SAart Bik 
1141e332c22cSNicolas Vasilache     emitCall(rewriter, loc,
1142e332c22cSNicolas Vasilache              LLVM::lookupOrCreatePrintOpenFn(op->getParentOfType<ModuleOp>()));
1143e332c22cSNicolas Vasilache     Operation *printComma =
1144e332c22cSNicolas Vasilache         LLVM::lookupOrCreatePrintCommaFn(op->getParentOfType<ModuleOp>());
1145cc311a15SMichal Terepeta 
1146cc311a15SMichal Terepeta     if (rank <= 1) {
1147cc311a15SMichal Terepeta       auto reducedType = vectorType.getElementType();
1148cc311a15SMichal Terepeta       auto llvmType = typeConverter->convertType(reducedType);
1149cc311a15SMichal Terepeta       int64_t dim = rank == 0 ? 1 : vectorType.getDimSize(0);
1150cc311a15SMichal Terepeta       for (int64_t d = 0; d < dim; ++d) {
1151cc311a15SMichal Terepeta         Value nestedVal = extractOne(rewriter, *getTypeConverter(), loc, value,
1152cc311a15SMichal Terepeta                                      llvmType, /*rank=*/0, /*pos=*/d);
1153cc311a15SMichal Terepeta         emitRanks(rewriter, op, nestedVal, reducedType, printer, /*rank=*/0,
1154cc311a15SMichal Terepeta                   conversion);
1155cc311a15SMichal Terepeta         if (d != dim - 1)
1156cc311a15SMichal Terepeta           emitCall(rewriter, loc, printComma);
1157cc311a15SMichal Terepeta       }
1158cc311a15SMichal Terepeta       emitCall(
1159cc311a15SMichal Terepeta           rewriter, loc,
1160cc311a15SMichal Terepeta           LLVM::lookupOrCreatePrintCloseFn(op->getParentOfType<ModuleOp>()));
1161cc311a15SMichal Terepeta       return;
1162cc311a15SMichal Terepeta     }
1163cc311a15SMichal Terepeta 
1164d9b500d3SAart Bik     int64_t dim = vectorType.getDimSize(0);
1165d9b500d3SAart Bik     for (int64_t d = 0; d < dim; ++d) {
1166cc311a15SMichal Terepeta       auto reducedType = reducedVectorTypeFront(vectorType);
1167cc311a15SMichal Terepeta       auto llvmType = typeConverter->convertType(reducedType);
1168dcec2ca5SChristian Sigg       Value nestedVal = extractOne(rewriter, *getTypeConverter(), loc, value,
1169dcec2ca5SChristian Sigg                                    llvmType, rank, d);
1170b8880f5fSAart Bik       emitRanks(rewriter, op, nestedVal, reducedType, printer, rank - 1,
1171b8880f5fSAart Bik                 conversion);
1172d9b500d3SAart Bik       if (d != dim - 1)
1173d9b500d3SAart Bik         emitCall(rewriter, loc, printComma);
1174d9b500d3SAart Bik     }
1175e332c22cSNicolas Vasilache     emitCall(rewriter, loc,
1176e332c22cSNicolas Vasilache              LLVM::lookupOrCreatePrintCloseFn(op->getParentOfType<ModuleOp>()));
1177d9b500d3SAart Bik   }
1178d9b500d3SAart Bik 
1179d9b500d3SAart Bik   // Helper to emit a call.
emitCall(ConversionPatternRewriter & rewriter,Location loc,Operation * ref,ValueRange params=ValueRange ())1180d9b500d3SAart Bik   static void emitCall(ConversionPatternRewriter &rewriter, Location loc,
1181d9b500d3SAart Bik                        Operation *ref, ValueRange params = ValueRange()) {
1182faf1c224SChris Lattner     rewriter.create<LLVM::CallOp>(loc, TypeRange(), SymbolRefAttr::get(ref),
1183faf1c224SChris Lattner                                   params);
1184d9b500d3SAart Bik   }
1185d9b500d3SAart Bik };
1186d9b500d3SAart Bik 
11876a8ba318SRiver Riddle /// The Splat operation is lowered to an insertelement + a shufflevector
11886a8ba318SRiver Riddle /// operation. Splat to only 0-d and 1-d vector result types are lowered.
11896a8ba318SRiver Riddle struct VectorSplatOpLowering : public ConvertOpToLLVMPattern<vector::SplatOp> {
11906a8ba318SRiver Riddle   using ConvertOpToLLVMPattern<vector::SplatOp>::ConvertOpToLLVMPattern;
11916a8ba318SRiver Riddle 
11926a8ba318SRiver Riddle   LogicalResult
matchAndRewrite__anon9084af800111::VectorSplatOpLowering11936a8ba318SRiver Riddle   matchAndRewrite(vector::SplatOp splatOp, OpAdaptor adaptor,
11946a8ba318SRiver Riddle                   ConversionPatternRewriter &rewriter) const override {
11956a8ba318SRiver Riddle     VectorType resultType = splatOp.getType().cast<VectorType>();
11966a8ba318SRiver Riddle     if (resultType.getRank() > 1)
11976a8ba318SRiver Riddle       return failure();
11986a8ba318SRiver Riddle 
11996a8ba318SRiver Riddle     // First insert it into an undef vector so we can shuffle it.
12006a8ba318SRiver Riddle     auto vectorType = typeConverter->convertType(splatOp.getType());
12016a8ba318SRiver Riddle     Value undef = rewriter.create<LLVM::UndefOp>(splatOp.getLoc(), vectorType);
12026a8ba318SRiver Riddle     auto zero = rewriter.create<LLVM::ConstantOp>(
12036a8ba318SRiver Riddle         splatOp.getLoc(),
12046a8ba318SRiver Riddle         typeConverter->convertType(rewriter.getIntegerType(32)),
12056a8ba318SRiver Riddle         rewriter.getZeroAttr(rewriter.getIntegerType(32)));
12066a8ba318SRiver Riddle 
12076a8ba318SRiver Riddle     // For 0-d vector, we simply do `insertelement`.
12086a8ba318SRiver Riddle     if (resultType.getRank() == 0) {
12096a8ba318SRiver Riddle       rewriter.replaceOpWithNewOp<LLVM::InsertElementOp>(
12107c38fd60SJacques Pienaar           splatOp, vectorType, undef, adaptor.getInput(), zero);
12116a8ba318SRiver Riddle       return success();
12126a8ba318SRiver Riddle     }
12136a8ba318SRiver Riddle 
12146a8ba318SRiver Riddle     // For 1-d vector, we additionally do a `vectorshuffle`.
12156a8ba318SRiver Riddle     auto v = rewriter.create<LLVM::InsertElementOp>(
12167c38fd60SJacques Pienaar         splatOp.getLoc(), vectorType, undef, adaptor.getInput(), zero);
12176a8ba318SRiver Riddle 
12186a8ba318SRiver Riddle     int64_t width = splatOp.getType().cast<VectorType>().getDimSize(0);
12196a8ba318SRiver Riddle     SmallVector<int32_t, 4> zeroValues(width, 0);
12206a8ba318SRiver Riddle 
12216a8ba318SRiver Riddle     // Shuffle the value across the desired number of elements.
12226a8ba318SRiver Riddle     ArrayAttr zeroAttrs = rewriter.getI32ArrayAttr(zeroValues);
12236a8ba318SRiver Riddle     rewriter.replaceOpWithNewOp<LLVM::ShuffleVectorOp>(splatOp, v, undef,
12246a8ba318SRiver Riddle                                                        zeroAttrs);
12256a8ba318SRiver Riddle     return success();
12266a8ba318SRiver Riddle   }
12276a8ba318SRiver Riddle };
12286a8ba318SRiver Riddle 
12296a8ba318SRiver Riddle /// The Splat operation is lowered to an insertelement + a shufflevector
12306a8ba318SRiver Riddle /// operation. Splat to only 2+-d vector result types are lowered by the
12316a8ba318SRiver Riddle /// SplatNdOpLowering, the 1-d case is handled by SplatOpLowering.
12326a8ba318SRiver Riddle struct VectorSplatNdOpLowering : public ConvertOpToLLVMPattern<SplatOp> {
12336a8ba318SRiver Riddle   using ConvertOpToLLVMPattern<SplatOp>::ConvertOpToLLVMPattern;
12346a8ba318SRiver Riddle 
12356a8ba318SRiver Riddle   LogicalResult
matchAndRewrite__anon9084af800111::VectorSplatNdOpLowering12366a8ba318SRiver Riddle   matchAndRewrite(SplatOp splatOp, OpAdaptor adaptor,
12376a8ba318SRiver Riddle                   ConversionPatternRewriter &rewriter) const override {
12386a8ba318SRiver Riddle     VectorType resultType = splatOp.getType();
12396a8ba318SRiver Riddle     if (resultType.getRank() <= 1)
12406a8ba318SRiver Riddle       return failure();
12416a8ba318SRiver Riddle 
12426a8ba318SRiver Riddle     // First insert it into an undef vector so we can shuffle it.
12436a8ba318SRiver Riddle     auto loc = splatOp.getLoc();
12446a8ba318SRiver Riddle     auto vectorTypeInfo =
12456a8ba318SRiver Riddle         LLVM::detail::extractNDVectorTypeInfo(resultType, *getTypeConverter());
12466a8ba318SRiver Riddle     auto llvmNDVectorTy = vectorTypeInfo.llvmNDVectorTy;
12476a8ba318SRiver Riddle     auto llvm1DVectorTy = vectorTypeInfo.llvm1DVectorTy;
12486a8ba318SRiver Riddle     if (!llvmNDVectorTy || !llvm1DVectorTy)
12496a8ba318SRiver Riddle       return failure();
12506a8ba318SRiver Riddle 
12516a8ba318SRiver Riddle     // Construct returned value.
12526a8ba318SRiver Riddle     Value desc = rewriter.create<LLVM::UndefOp>(loc, llvmNDVectorTy);
12536a8ba318SRiver Riddle 
12546a8ba318SRiver Riddle     // Construct a 1-D vector with the splatted value that we insert in all the
12556a8ba318SRiver Riddle     // places within the returned descriptor.
12566a8ba318SRiver Riddle     Value vdesc = rewriter.create<LLVM::UndefOp>(loc, llvm1DVectorTy);
12576a8ba318SRiver Riddle     auto zero = rewriter.create<LLVM::ConstantOp>(
12586a8ba318SRiver Riddle         loc, typeConverter->convertType(rewriter.getIntegerType(32)),
12596a8ba318SRiver Riddle         rewriter.getZeroAttr(rewriter.getIntegerType(32)));
12606a8ba318SRiver Riddle     Value v = rewriter.create<LLVM::InsertElementOp>(loc, llvm1DVectorTy, vdesc,
12617c38fd60SJacques Pienaar                                                      adaptor.getInput(), zero);
12626a8ba318SRiver Riddle 
12636a8ba318SRiver Riddle     // Shuffle the value across the desired number of elements.
12646a8ba318SRiver Riddle     int64_t width = resultType.getDimSize(resultType.getRank() - 1);
12656a8ba318SRiver Riddle     SmallVector<int32_t, 4> zeroValues(width, 0);
12666a8ba318SRiver Riddle     ArrayAttr zeroAttrs = rewriter.getI32ArrayAttr(zeroValues);
12676a8ba318SRiver Riddle     v = rewriter.create<LLVM::ShuffleVectorOp>(loc, v, v, zeroAttrs);
12686a8ba318SRiver Riddle 
12696a8ba318SRiver Riddle     // Iterate of linear index, convert to coords space and insert splatted 1-D
12706a8ba318SRiver Riddle     // vector in each position.
12716a8ba318SRiver Riddle     nDVectorIterate(vectorTypeInfo, rewriter, [&](ArrayAttr position) {
12726a8ba318SRiver Riddle       desc = rewriter.create<LLVM::InsertValueOp>(loc, llvmNDVectorTy, desc, v,
12736a8ba318SRiver Riddle                                                   position);
12746a8ba318SRiver Riddle     });
12756a8ba318SRiver Riddle     rewriter.replaceOp(splatOp, desc);
12766a8ba318SRiver Riddle     return success();
12776a8ba318SRiver Riddle   }
12786a8ba318SRiver Riddle };
12796a8ba318SRiver Riddle 
1280df186507SBenjamin Kramer } // namespace
1281df186507SBenjamin Kramer 
12825c0c51a9SNicolas Vasilache /// Populate the given list with patterns that convert from Vector to LLVM.
populateVectorToLLVMConversionPatterns(LLVMTypeConverter & converter,RewritePatternSet & patterns,bool reassociateFPReductions,bool force32BitVectorIndices)12837bc8ad51SJavier Setoain void mlir::populateVectorToLLVMConversionPatterns(
12847bc8ad51SJavier Setoain     LLVMTypeConverter &converter, RewritePatternSet &patterns,
12857bc8ad51SJavier Setoain     bool reassociateFPReductions, bool force32BitVectorIndices) {
128665678d93SNicolas Vasilache   MLIRContext *ctx = converter.getDialect()->getContext();
1287eda2ebd7SNicolas Vasilache   patterns.add<VectorFMAOpNDRewritePattern>(ctx);
1288eda2ebd7SNicolas Vasilache   populateVectorInsertExtractStridedSliceTransforms(patterns);
1289dc4e913bSChris Lattner   patterns.add<VectorReductionOpConversion>(converter, reassociateFPReductions);
12907bc8ad51SJavier Setoain   patterns.add<VectorCreateMaskOpRewritePattern>(ctx, force32BitVectorIndices);
12918345b86dSNicolas Vasilache   patterns
1292dc4e913bSChris Lattner       .add<VectorBitCastOpConversion, VectorShuffleOpConversion,
1293dc4e913bSChris Lattner            VectorExtractElementOpConversion, VectorExtractOpConversion,
1294dc4e913bSChris Lattner            VectorFMAOp1DConversion, VectorInsertElementOpConversion,
1295dc4e913bSChris Lattner            VectorInsertOpConversion, VectorPrintOpConversion,
1296a4830d14SJavier Setoain            VectorTypeCastOpConversion, VectorScaleOpConversion,
1297dc4e913bSChris Lattner            VectorLoadStoreConversion<vector::LoadOp, vector::LoadOpAdaptor>,
1298ee66e43aSDiego Caballero            VectorLoadStoreConversion<vector::MaskedLoadOp,
1299ee66e43aSDiego Caballero                                      vector::MaskedLoadOpAdaptor>,
1300dc4e913bSChris Lattner            VectorLoadStoreConversion<vector::StoreOp, vector::StoreOpAdaptor>,
1301ee66e43aSDiego Caballero            VectorLoadStoreConversion<vector::MaskedStoreOp,
1302ee66e43aSDiego Caballero                                      vector::MaskedStoreOpAdaptor>,
1303dc4e913bSChris Lattner            VectorGatherOpConversion, VectorScatterOpConversion,
13046a8ba318SRiver Riddle            VectorExpandLoadOpConversion, VectorCompressStoreOpConversion,
13056a8ba318SRiver Riddle            VectorSplatOpLowering, VectorSplatNdOpLowering>(converter);
1306d1a9e9a7SMatthias Springer   // Transfer ops with rank > 1 are handled by VectorToSCF.
1307d1a9e9a7SMatthias Springer   populateVectorTransferLoweringPatterns(patterns, /*maxTransferRank=*/1);
13085c0c51a9SNicolas Vasilache }
13095c0c51a9SNicolas Vasilache 
populateVectorToLLVMMatrixConversionPatterns(LLVMTypeConverter & converter,RewritePatternSet & patterns)131063b683a8SNicolas Vasilache void mlir::populateVectorToLLVMMatrixConversionPatterns(
1311dc4e913bSChris Lattner     LLVMTypeConverter &converter, RewritePatternSet &patterns) {
1312dc4e913bSChris Lattner   patterns.add<VectorMatmulOpConversion>(converter);
1313dc4e913bSChris Lattner   patterns.add<VectorFlatTransposeOpConversion>(converter);
131463b683a8SNicolas Vasilache }
1315