Vector/Utils/VectorUtils.cpp

99ef9eebSMatthias Springer//===- VectorUtils.cpp - MLIR Utilities for VectorOps   ------------------===//
99ef9eebSMatthias Springer//
99ef9eebSMatthias Springer// Part of the MLIR Project, under the Apache License v2.0 with LLVM Exceptions.
99ef9eebSMatthias Springer// See https://llvm.org/LICENSE.txt for license information.
99ef9eebSMatthias Springer// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
99ef9eebSMatthias Springer//
99ef9eebSMatthias Springer//===----------------------------------------------------------------------===//
99ef9eebSMatthias Springer//
99ef9eebSMatthias Springer// This file implements utility methods for working with the Vector dialect.
99ef9eebSMatthias Springer//
99ef9eebSMatthias Springer//===----------------------------------------------------------------------===//
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer#include "mlir/Dialect/Vector/Utils/VectorUtils.h"
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer#include "mlir/Dialect/Affine/Analysis/LoopAnalysis.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/Affine/IR/AffineOps.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/Arithmetic/IR/Arithmetic.h"
23aa5a74SRiver Riddle#include "mlir/Dialect/Func/IR/FuncOps.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/MemRef/IR/MemRef.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/Tensor/IR/Tensor.h"
99ef9eebSMatthias Springer#include "mlir/Dialect/Vector/IR/VectorOps.h"
99ef9eebSMatthias Springer#include "mlir/IR/Builders.h"
99ef9eebSMatthias Springer#include "mlir/IR/IntegerSet.h"
99ef9eebSMatthias Springer#include "mlir/IR/Operation.h"
9b5a3d14SMatthias Springer#include "mlir/IR/TypeUtilities.h"
99ef9eebSMatthias Springer#include "mlir/Support/LLVM.h"
99ef9eebSMatthias Springer#include "mlir/Support/MathExtras.h"
99ef9eebSMatthias Springer#include <numeric>
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer#include "llvm/ADT/DenseSet.h"
99ef9eebSMatthias Springer#include "llvm/ADT/SetVector.h"
99ef9eebSMatthias Springer
99ef9eebSMatthias Springerusing namespace mlir;
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer/// Helper function that creates a memref::DimOp or tensor::DimOp depending on
99ef9eebSMatthias Springer/// the type of `source`.
99ef9eebSMatthias SpringerValue mlir::vector::createOrFoldDimOp(OpBuilder &b, Location loc, Value source,
99ef9eebSMatthias Springer                                      int64_t dim) {
99ef9eebSMatthias Springer  if (source.getType().isa<UnrankedMemRefType, MemRefType>())
99ef9eebSMatthias Springer    return b.createOrFold<memref::DimOp>(loc, source, dim);
99ef9eebSMatthias Springer  if (source.getType().isa<UnrankedTensorType, RankedTensorType>())
99ef9eebSMatthias Springer    return b.createOrFold<tensor::DimOp>(loc, source, dim);
99ef9eebSMatthias Springer  llvm_unreachable("Expected MemRefType or TensorType");
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer/// Return the number of elements of basis, `0` if empty.
99ef9eebSMatthias Springerint64_t mlir::computeMaxLinearIndex(ArrayRef<int64_t> basis) {
99ef9eebSMatthias Springer  if (basis.empty())
99ef9eebSMatthias Springer    return 0;
99ef9eebSMatthias Springer  return std::accumulate(basis.begin(), basis.end(), 1,
99ef9eebSMatthias Springer                         std::multiplies<int64_t>());
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias SpringerSmallVector<int64_t, 4> mlir::computeStrides(ArrayRef<int64_t> shape,
99ef9eebSMatthias Springer                                             ArrayRef<int64_t> sizes) {
99ef9eebSMatthias Springer  int64_t rank = shape.size();
99ef9eebSMatthias Springer  // Compute the count for each dimension.
99ef9eebSMatthias Springer  SmallVector<int64_t, 4> sliceDimCounts(rank);
99ef9eebSMatthias Springer  for (int64_t r = 0; r < rank; ++r)
99ef9eebSMatthias Springer    sliceDimCounts[r] = ceilDiv(shape[r], sizes[r]);
99ef9eebSMatthias Springer  // Use that to compute the slice stride for each dimension.
99ef9eebSMatthias Springer  SmallVector<int64_t, 4> sliceStrides(rank);
99ef9eebSMatthias Springer  sliceStrides[rank - 1] = 1;
99ef9eebSMatthias Springer  for (int64_t r = rank - 2; r >= 0; --r)
99ef9eebSMatthias Springer    sliceStrides[r] = sliceStrides[r + 1] * sliceDimCounts[r + 1];
99ef9eebSMatthias Springer  return sliceStrides;
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias SpringerSmallVector<int64_t, 4> mlir::computeElementOffsetsFromVectorSliceOffsets(
99ef9eebSMatthias Springer    ArrayRef<int64_t> sizes, ArrayRef<int64_t> vectorOffsets) {
99ef9eebSMatthias Springer  SmallVector<int64_t, 4> result;
99ef9eebSMatthias Springer  for (auto it : llvm::zip(vectorOffsets, sizes))
99ef9eebSMatthias Springer    result.push_back(std::get<0>(it) * std::get<1>(it));
99ef9eebSMatthias Springer  return result;
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias SpringerOptional<SmallVector<int64_t, 4>> mlir::shapeRatio(ArrayRef<int64_t> superShape,
99ef9eebSMatthias Springer                                                   ArrayRef<int64_t> subShape) {
99ef9eebSMatthias Springer  if (superShape.size() < subShape.size()) {
99ef9eebSMatthias Springer    return Optional<SmallVector<int64_t, 4>>();
99ef9eebSMatthias Springer  }
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  // Starting from the end, compute the integer divisors.
99ef9eebSMatthias Springer  std::vector<int64_t> result;
99ef9eebSMatthias Springer  result.reserve(superShape.size());
99ef9eebSMatthias Springer  int64_t superSize = 0, subSize = 0;
99ef9eebSMatthias Springer  for (auto it :
99ef9eebSMatthias Springer       llvm::zip(llvm::reverse(superShape), llvm::reverse(subShape))) {
99ef9eebSMatthias Springer    std::tie(superSize, subSize) = it;
99ef9eebSMatthias Springer    assert(superSize > 0 && "superSize must be > 0");
99ef9eebSMatthias Springer    assert(subSize > 0 && "subSize must be > 0");
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer    // If integral division does not occur, return and let the caller decide.
99ef9eebSMatthias Springer    if (superSize % subSize != 0)
99ef9eebSMatthias Springer      return None;
99ef9eebSMatthias Springer    result.push_back(superSize / subSize);
99ef9eebSMatthias Springer  }
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  // At this point we computed the ratio (in reverse) for the common
99ef9eebSMatthias Springer  // size. Fill with the remaining entries from the super-vector shape (still in
99ef9eebSMatthias Springer  // reverse).
99ef9eebSMatthias Springer  int commonSize = subShape.size();
99ef9eebSMatthias Springer  std::copy(superShape.rbegin() + commonSize, superShape.rend(),
99ef9eebSMatthias Springer            std::back_inserter(result));
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  assert(result.size() == superShape.size() &&
99ef9eebSMatthias Springer         "super to sub shape ratio is not of the same size as the super rank");
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  // Reverse again to get it back in the proper order and return.
99ef9eebSMatthias Springer  return SmallVector<int64_t, 4>{result.rbegin(), result.rend()};
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias SpringerOptional<SmallVector<int64_t, 4>> mlir::shapeRatio(VectorType superVectorType,
99ef9eebSMatthias Springer                                                   VectorType subVectorType) {
99ef9eebSMatthias Springer  assert(superVectorType.getElementType() == subVectorType.getElementType() &&
99ef9eebSMatthias Springer         "vector types must be of the same elemental type");
99ef9eebSMatthias Springer  return shapeRatio(superVectorType.getShape(), subVectorType.getShape());
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer/// Constructs a permutation map from memref indices to vector dimension.
99ef9eebSMatthias Springer///
99ef9eebSMatthias Springer/// The implementation uses the knowledge of the mapping of enclosing loop to
99ef9eebSMatthias Springer/// vector dimension. `enclosingLoopToVectorDim` carries this information as a
99ef9eebSMatthias Springer/// map with:
99ef9eebSMatthias Springer///   - keys representing "vectorized enclosing loops";
99ef9eebSMatthias Springer///   - values representing the corresponding vector dimension.
99ef9eebSMatthias Springer/// The algorithm traverses "vectorized enclosing loops" and extracts the
99ef9eebSMatthias Springer/// at-most-one MemRef index that is invariant along said loop. This index is
99ef9eebSMatthias Springer/// guaranteed to be at most one by construction: otherwise the MemRef is not
99ef9eebSMatthias Springer/// vectorizable.
99ef9eebSMatthias Springer/// If this invariant index is found, it is added to the permutation_map at the
99ef9eebSMatthias Springer/// proper vector dimension.
99ef9eebSMatthias Springer/// If no index is found to be invariant, 0 is added to the permutation_map and
99ef9eebSMatthias Springer/// corresponds to a vector broadcast along that dimension.
99ef9eebSMatthias Springer///
99ef9eebSMatthias Springer/// Returns an empty AffineMap if `enclosingLoopToVectorDim` is empty,
99ef9eebSMatthias Springer/// signalling that no permutation map can be constructed given
99ef9eebSMatthias Springer/// `enclosingLoopToVectorDim`.
99ef9eebSMatthias Springer///
99ef9eebSMatthias Springer/// Examples can be found in the documentation of `makePermutationMap`, in the
99ef9eebSMatthias Springer/// header file.
99ef9eebSMatthias Springerstatic AffineMap makePermutationMap(
99ef9eebSMatthias Springer    ArrayRef<Value> indices,
99ef9eebSMatthias Springer    const DenseMap<Operation *, unsigned> &enclosingLoopToVectorDim) {
99ef9eebSMatthias Springer  if (enclosingLoopToVectorDim.empty())
99ef9eebSMatthias Springer    return AffineMap();
99ef9eebSMatthias Springer  MLIRContext *context =
99ef9eebSMatthias Springer      enclosingLoopToVectorDim.begin()->getFirst()->getContext();
99ef9eebSMatthias Springer  SmallVector<AffineExpr, 4> perm(enclosingLoopToVectorDim.size(),
99ef9eebSMatthias Springer                                  getAffineConstantExpr(0, context));
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  for (auto kvp : enclosingLoopToVectorDim) {
99ef9eebSMatthias Springer    assert(kvp.second < perm.size());
99ef9eebSMatthias Springer    auto invariants = getInvariantAccesses(
99ef9eebSMatthias Springer        cast<AffineForOp>(kvp.first).getInductionVar(), indices);
99ef9eebSMatthias Springer    unsigned numIndices = indices.size();
99ef9eebSMatthias Springer    unsigned countInvariantIndices = 0;
99ef9eebSMatthias Springer    for (unsigned dim = 0; dim < numIndices; ++dim) {
99ef9eebSMatthias Springer      if (!invariants.count(indices[dim])) {
99ef9eebSMatthias Springer        assert(perm[kvp.second] == getAffineConstantExpr(0, context) &&
99ef9eebSMatthias Springer               "permutationMap already has an entry along dim");
99ef9eebSMatthias Springer        perm[kvp.second] = getAffineDimExpr(dim, context);
99ef9eebSMatthias Springer      } else {
99ef9eebSMatthias Springer        ++countInvariantIndices;
99ef9eebSMatthias Springer      }
99ef9eebSMatthias Springer    }
99ef9eebSMatthias Springer    assert((countInvariantIndices == numIndices ||
99ef9eebSMatthias Springer            countInvariantIndices == numIndices - 1) &&
99ef9eebSMatthias Springer           "Vectorization prerequisite violated: at most 1 index may be "
99ef9eebSMatthias Springer           "invariant wrt a vectorized loop");
99ef9eebSMatthias Springer  }
99ef9eebSMatthias Springer  return AffineMap::get(indices.size(), 0, perm, context);
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer/// Implementation detail that walks up the parents and records the ones with
99ef9eebSMatthias Springer/// the specified type.
99ef9eebSMatthias Springer/// TODO: could also be implemented as a collect parents followed by a
99ef9eebSMatthias Springer/// filter and made available outside this file.
99ef9eebSMatthias Springertemplate <typename T>
99ef9eebSMatthias Springerstatic SetVector<Operation *> getParentsOfType(Block *block) {
99ef9eebSMatthias Springer  SetVector<Operation *> res;
99ef9eebSMatthias Springer  auto *current = block->getParentOp();
99ef9eebSMatthias Springer  while (current) {
99ef9eebSMatthias Springer    if (auto typedParent = dyn_cast<T>(current)) {
99ef9eebSMatthias Springer      assert(res.count(current) == 0 && "Already inserted");
99ef9eebSMatthias Springer      res.insert(current);
99ef9eebSMatthias Springer    }
99ef9eebSMatthias Springer    current = current->getParentOp();
99ef9eebSMatthias Springer  }
99ef9eebSMatthias Springer  return res;
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer/// Returns the enclosing AffineForOp, from closest to farthest.
99ef9eebSMatthias Springerstatic SetVector<Operation *> getEnclosingforOps(Block *block) {
99ef9eebSMatthias Springer  return getParentsOfType<AffineForOp>(block);
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias SpringerAffineMap mlir::makePermutationMap(
99ef9eebSMatthias Springer    Block *insertPoint, ArrayRef<Value> indices,
99ef9eebSMatthias Springer    const DenseMap<Operation *, unsigned> &loopToVectorDim) {
99ef9eebSMatthias Springer  DenseMap<Operation *, unsigned> enclosingLoopToVectorDim;
99ef9eebSMatthias Springer  auto enclosingLoops = getEnclosingforOps(insertPoint);
99ef9eebSMatthias Springer  for (auto *forInst : enclosingLoops) {
99ef9eebSMatthias Springer    auto it = loopToVectorDim.find(forInst);
99ef9eebSMatthias Springer    if (it != loopToVectorDim.end()) {
99ef9eebSMatthias Springer      enclosingLoopToVectorDim.insert(*it);
99ef9eebSMatthias Springer    }
99ef9eebSMatthias Springer  }
99ef9eebSMatthias Springer  return ::makePermutationMap(indices, enclosingLoopToVectorDim);
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias SpringerAffineMap mlir::makePermutationMap(
99ef9eebSMatthias Springer    Operation *op, ArrayRef<Value> indices,
99ef9eebSMatthias Springer    const DenseMap<Operation *, unsigned> &loopToVectorDim) {
99ef9eebSMatthias Springer  return makePermutationMap(op->getBlock(), indices, loopToVectorDim);
99ef9eebSMatthias Springer}
99ef9eebSMatthias Springer
99ef9eebSMatthias Springerbool matcher::operatesOnSuperVectorsOf(Operation &op,
99ef9eebSMatthias Springer                                       VectorType subVectorType) {
99ef9eebSMatthias Springer  // First, extract the vector type and distinguish between:
99ef9eebSMatthias Springer  //   a. ops that *must* lower a super-vector (i.e. vector.transfer_read,
99ef9eebSMatthias Springer  //      vector.transfer_write); and
99ef9eebSMatthias Springer  //   b. ops that *may* lower a super-vector (all other ops).
99ef9eebSMatthias Springer  // The ops that *may* lower a super-vector only do so if the super-vector to
99ef9eebSMatthias Springer  // sub-vector ratio exists. The ops that *must* lower a super-vector are
99ef9eebSMatthias Springer  // explicitly checked for this property.
99ef9eebSMatthias Springer  /// TODO: there should be a single function for all ops to do this so we
99ef9eebSMatthias Springer  /// do not have to special case. Maybe a trait, or just a method, unclear atm.
99ef9eebSMatthias Springer  bool mustDivide = false;
99ef9eebSMatthias Springer  (void)mustDivide;
99ef9eebSMatthias Springer  VectorType superVectorType;
99ef9eebSMatthias Springer  if (auto transfer = dyn_cast<VectorTransferOpInterface>(op)) {
99ef9eebSMatthias Springer    superVectorType = transfer.getVectorType();
99ef9eebSMatthias Springer    mustDivide = true;
99ef9eebSMatthias Springer  } else if (op.getNumResults() == 0) {
23aa5a74SRiver Riddle    if (!isa<func::ReturnOp>(op)) {
99ef9eebSMatthias Springer      op.emitError("NYI: assuming only return operations can have 0 "
99ef9eebSMatthias Springer                   " results at this point");
99ef9eebSMatthias Springer    }
99ef9eebSMatthias Springer    return false;
99ef9eebSMatthias Springer  } else if (op.getNumResults() == 1) {
99ef9eebSMatthias Springer    if (auto v = op.getResult(0).getType().dyn_cast<VectorType>()) {
99ef9eebSMatthias Springer      superVectorType = v;
99ef9eebSMatthias Springer    } else {
99ef9eebSMatthias Springer      // Not a vector type.
99ef9eebSMatthias Springer      return false;
99ef9eebSMatthias Springer    }
99ef9eebSMatthias Springer  } else {
99ef9eebSMatthias Springer    // Not a vector.transfer and has more than 1 result, fail hard for now to
99ef9eebSMatthias Springer    // wake us up when something changes.
99ef9eebSMatthias Springer    op.emitError("NYI: operation has more than 1 result");
99ef9eebSMatthias Springer    return false;
99ef9eebSMatthias Springer  }
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  // Get the ratio.
99ef9eebSMatthias Springer  auto ratio = shapeRatio(superVectorType, subVectorType);
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  // Sanity check.
5413bf1bSKazu Hirata  assert((ratio || !mustDivide) &&
99ef9eebSMatthias Springer         "vector.transfer operation in which super-vector size is not an"
99ef9eebSMatthias Springer         " integer multiple of sub-vector size");
99ef9eebSMatthias Springer
99ef9eebSMatthias Springer  // This catches cases that are not strictly necessary to have multiplicity but
99ef9eebSMatthias Springer  // still aren't divisible by the sub-vector shape.
99ef9eebSMatthias Springer  // This could be useful information if we wanted to reshape at the level of
99ef9eebSMatthias Springer  // the vector type (but we would have to look at the compute and distinguish
99ef9eebSMatthias Springer  // between parallel, reduction and possibly other cases.
*064a08cdSKazu Hirata  return ratio.has_value();
99ef9eebSMatthias Springer}