//===- ByteCode.cpp - Pattern ByteCode Interpreter ------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file implements MLIR to byte-code generation and the interpreter. // //===----------------------------------------------------------------------===// #include "ByteCode.h" #include "mlir/Analysis/Liveness.h" #include "mlir/Dialect/PDL/IR/PDLTypes.h" #include "mlir/Dialect/PDLInterp/IR/PDLInterp.h" #include "mlir/IR/BuiltinOps.h" #include "mlir/IR/RegionGraphTraits.h" #include "llvm/ADT/IntervalMap.h" #include "llvm/ADT/PostOrderIterator.h" #include "llvm/ADT/TypeSwitch.h" #include "llvm/Support/Debug.h" #include "llvm/Support/Format.h" #include "llvm/Support/FormatVariadic.h" #include #define DEBUG_TYPE "pdl-bytecode" using namespace mlir; using namespace mlir::detail; //===----------------------------------------------------------------------===// // PDLByteCodePattern //===----------------------------------------------------------------------===// PDLByteCodePattern PDLByteCodePattern::create(pdl_interp::RecordMatchOp matchOp, ByteCodeAddr rewriterAddr) { SmallVector generatedOps; if (ArrayAttr generatedOpsAttr = matchOp.generatedOpsAttr()) generatedOps = llvm::to_vector<8>(generatedOpsAttr.getAsValueRange()); PatternBenefit benefit = matchOp.benefit(); MLIRContext *ctx = matchOp.getContext(); // Check to see if this is pattern matches a specific operation type. if (Optional rootKind = matchOp.rootKind()) return PDLByteCodePattern(rewriterAddr, *rootKind, benefit, ctx, generatedOps); return PDLByteCodePattern(rewriterAddr, MatchAnyOpTypeTag(), benefit, ctx, generatedOps); } //===----------------------------------------------------------------------===// // PDLByteCodeMutableState //===----------------------------------------------------------------------===// /// Set the new benefit for a bytecode pattern. The `patternIndex` corresponds /// to the position of the pattern within the range returned by /// `PDLByteCode::getPatterns`. void PDLByteCodeMutableState::updatePatternBenefit(unsigned patternIndex, PatternBenefit benefit) { currentPatternBenefits[patternIndex] = benefit; } /// Cleanup any allocated state after a full match/rewrite has been completed. /// This method should be called irregardless of whether the match+rewrite was a /// success or not. void PDLByteCodeMutableState::cleanupAfterMatchAndRewrite() { allocatedTypeRangeMemory.clear(); allocatedValueRangeMemory.clear(); } //===----------------------------------------------------------------------===// // Bytecode OpCodes //===----------------------------------------------------------------------===// namespace { enum OpCode : ByteCodeField { /// Apply an externally registered constraint. ApplyConstraint, /// Apply an externally registered rewrite. ApplyRewrite, /// Check if two generic values are equal. AreEqual, /// Check if two ranges are equal. AreRangesEqual, /// Unconditional branch. Branch, /// Compare the operand count of an operation with a constant. CheckOperandCount, /// Compare the name of an operation with a constant. CheckOperationName, /// Compare the result count of an operation with a constant. CheckResultCount, /// Compare a range of types to a constant range of types. CheckTypes, /// Continue to the next iteration of a loop. Continue, /// Create an operation. CreateOperation, /// Create a range of types. CreateTypes, /// Erase an operation. EraseOp, /// Extract the op from a range at the specified index. ExtractOp, /// Extract the type from a range at the specified index. ExtractType, /// Extract the value from a range at the specified index. ExtractValue, /// Terminate a matcher or rewrite sequence. Finalize, /// Iterate over a range of values. ForEach, /// Get a specific attribute of an operation. GetAttribute, /// Get the type of an attribute. GetAttributeType, /// Get the defining operation of a value. GetDefiningOp, /// Get a specific operand of an operation. GetOperand0, GetOperand1, GetOperand2, GetOperand3, GetOperandN, /// Get a specific operand group of an operation. GetOperands, /// Get a specific result of an operation. GetResult0, GetResult1, GetResult2, GetResult3, GetResultN, /// Get a specific result group of an operation. GetResults, /// Get the users of a value or a range of values. GetUsers, /// Get the type of a value. GetValueType, /// Get the types of a value range. GetValueRangeTypes, /// Check if a generic value is not null. IsNotNull, /// Record a successful pattern match. RecordMatch, /// Replace an operation. ReplaceOp, /// Compare an attribute with a set of constants. SwitchAttribute, /// Compare the operand count of an operation with a set of constants. SwitchOperandCount, /// Compare the name of an operation with a set of constants. SwitchOperationName, /// Compare the result count of an operation with a set of constants. SwitchResultCount, /// Compare a type with a set of constants. SwitchType, /// Compare a range of types with a set of constants. SwitchTypes, }; } // namespace //===----------------------------------------------------------------------===// // ByteCode Generation //===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===// // Generator namespace { struct ByteCodeLiveRange; struct ByteCodeWriter; /// Check if the given class `T` can be converted to an opaque pointer. template using has_pointer_traits = decltype(std::declval().getAsOpaquePointer()); /// This class represents the main generator for the pattern bytecode. class Generator { public: Generator(MLIRContext *ctx, std::vector &uniquedData, SmallVectorImpl &matcherByteCode, SmallVectorImpl &rewriterByteCode, SmallVectorImpl &patterns, ByteCodeField &maxValueMemoryIndex, ByteCodeField &maxOpRangeMemoryIndex, ByteCodeField &maxTypeRangeMemoryIndex, ByteCodeField &maxValueRangeMemoryIndex, ByteCodeField &maxLoopLevel, llvm::StringMap &constraintFns, llvm::StringMap &rewriteFns) : ctx(ctx), uniquedData(uniquedData), matcherByteCode(matcherByteCode), rewriterByteCode(rewriterByteCode), patterns(patterns), maxValueMemoryIndex(maxValueMemoryIndex), maxOpRangeMemoryIndex(maxOpRangeMemoryIndex), maxTypeRangeMemoryIndex(maxTypeRangeMemoryIndex), maxValueRangeMemoryIndex(maxValueRangeMemoryIndex), maxLoopLevel(maxLoopLevel) { for (auto it : llvm::enumerate(constraintFns)) constraintToMemIndex.try_emplace(it.value().first(), it.index()); for (auto it : llvm::enumerate(rewriteFns)) externalRewriterToMemIndex.try_emplace(it.value().first(), it.index()); } /// Generate the bytecode for the given PDL interpreter module. void generate(ModuleOp module); /// Return the memory index to use for the given value. ByteCodeField &getMemIndex(Value value) { assert(valueToMemIndex.count(value) && "expected memory index to be assigned"); return valueToMemIndex[value]; } /// Return the range memory index used to store the given range value. ByteCodeField &getRangeStorageIndex(Value value) { assert(valueToRangeIndex.count(value) && "expected range index to be assigned"); return valueToRangeIndex[value]; } /// Return an index to use when referring to the given data that is uniqued in /// the MLIR context. template std::enable_if_t::value, ByteCodeField &> getMemIndex(T val) { const void *opaqueVal = val.getAsOpaquePointer(); // Get or insert a reference to this value. auto it = uniquedDataToMemIndex.try_emplace( opaqueVal, maxValueMemoryIndex + uniquedData.size()); if (it.second) uniquedData.push_back(opaqueVal); return it.first->second; } private: /// Allocate memory indices for the results of operations within the matcher /// and rewriters. void allocateMemoryIndices(FuncOp matcherFunc, ModuleOp rewriterModule); /// Generate the bytecode for the given operation. void generate(Region *region, ByteCodeWriter &writer); void generate(Operation *op, ByteCodeWriter &writer); void generate(pdl_interp::ApplyConstraintOp op, ByteCodeWriter &writer); void generate(pdl_interp::ApplyRewriteOp op, ByteCodeWriter &writer); void generate(pdl_interp::AreEqualOp op, ByteCodeWriter &writer); void generate(pdl_interp::BranchOp op, ByteCodeWriter &writer); void generate(pdl_interp::CheckAttributeOp op, ByteCodeWriter &writer); void generate(pdl_interp::CheckOperandCountOp op, ByteCodeWriter &writer); void generate(pdl_interp::CheckOperationNameOp op, ByteCodeWriter &writer); void generate(pdl_interp::CheckResultCountOp op, ByteCodeWriter &writer); void generate(pdl_interp::CheckTypeOp op, ByteCodeWriter &writer); void generate(pdl_interp::CheckTypesOp op, ByteCodeWriter &writer); void generate(pdl_interp::ContinueOp op, ByteCodeWriter &writer); void generate(pdl_interp::CreateAttributeOp op, ByteCodeWriter &writer); void generate(pdl_interp::CreateOperationOp op, ByteCodeWriter &writer); void generate(pdl_interp::CreateTypeOp op, ByteCodeWriter &writer); void generate(pdl_interp::CreateTypesOp op, ByteCodeWriter &writer); void generate(pdl_interp::EraseOp op, ByteCodeWriter &writer); void generate(pdl_interp::ExtractOp op, ByteCodeWriter &writer); void generate(pdl_interp::FinalizeOp op, ByteCodeWriter &writer); void generate(pdl_interp::ForEachOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetAttributeOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetAttributeTypeOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetDefiningOpOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetOperandOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetOperandsOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetResultOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetResultsOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetUsersOp op, ByteCodeWriter &writer); void generate(pdl_interp::GetValueTypeOp op, ByteCodeWriter &writer); void generate(pdl_interp::InferredTypesOp op, ByteCodeWriter &writer); void generate(pdl_interp::IsNotNullOp op, ByteCodeWriter &writer); void generate(pdl_interp::RecordMatchOp op, ByteCodeWriter &writer); void generate(pdl_interp::ReplaceOp op, ByteCodeWriter &writer); void generate(pdl_interp::SwitchAttributeOp op, ByteCodeWriter &writer); void generate(pdl_interp::SwitchTypeOp op, ByteCodeWriter &writer); void generate(pdl_interp::SwitchTypesOp op, ByteCodeWriter &writer); void generate(pdl_interp::SwitchOperandCountOp op, ByteCodeWriter &writer); void generate(pdl_interp::SwitchOperationNameOp op, ByteCodeWriter &writer); void generate(pdl_interp::SwitchResultCountOp op, ByteCodeWriter &writer); /// Mapping from value to its corresponding memory index. DenseMap valueToMemIndex; /// Mapping from a range value to its corresponding range storage index. DenseMap valueToRangeIndex; /// Mapping from the name of an externally registered rewrite to its index in /// the bytecode registry. llvm::StringMap externalRewriterToMemIndex; /// Mapping from the name of an externally registered constraint to its index /// in the bytecode registry. llvm::StringMap constraintToMemIndex; /// Mapping from rewriter function name to the bytecode address of the /// rewriter function in byte. llvm::StringMap rewriterToAddr; /// Mapping from a uniqued storage object to its memory index within /// `uniquedData`. DenseMap uniquedDataToMemIndex; /// The current level of the foreach loop. ByteCodeField curLoopLevel = 0; /// The current MLIR context. MLIRContext *ctx; /// Mapping from block to its address. DenseMap blockToAddr; /// Data of the ByteCode class to be populated. std::vector &uniquedData; SmallVectorImpl &matcherByteCode; SmallVectorImpl &rewriterByteCode; SmallVectorImpl &patterns; ByteCodeField &maxValueMemoryIndex; ByteCodeField &maxOpRangeMemoryIndex; ByteCodeField &maxTypeRangeMemoryIndex; ByteCodeField &maxValueRangeMemoryIndex; ByteCodeField &maxLoopLevel; }; /// This class provides utilities for writing a bytecode stream. struct ByteCodeWriter { ByteCodeWriter(SmallVectorImpl &bytecode, Generator &generator) : bytecode(bytecode), generator(generator) {} /// Append a field to the bytecode. void append(ByteCodeField field) { bytecode.push_back(field); } void append(OpCode opCode) { bytecode.push_back(opCode); } /// Append an address to the bytecode. void append(ByteCodeAddr field) { static_assert((sizeof(ByteCodeAddr) / sizeof(ByteCodeField)) == 2, "unexpected ByteCode address size"); ByteCodeField fieldParts[2]; std::memcpy(fieldParts, &field, sizeof(ByteCodeAddr)); bytecode.append({fieldParts[0], fieldParts[1]}); } /// Append a single successor to the bytecode, the exact address will need to /// be resolved later. void append(Block *successor) { // Add back a reference to the successor so that the address can be resolved // later. unresolvedSuccessorRefs[successor].push_back(bytecode.size()); append(ByteCodeAddr(0)); } /// Append a successor range to the bytecode, the exact address will need to /// be resolved later. void append(SuccessorRange successors) { for (Block *successor : successors) append(successor); } /// Append a range of values that will be read as generic PDLValues. void appendPDLValueList(OperandRange values) { bytecode.push_back(values.size()); for (Value value : values) appendPDLValue(value); } /// Append a value as a PDLValue. void appendPDLValue(Value value) { appendPDLValueKind(value); append(value); } /// Append the PDLValue::Kind of the given value. void appendPDLValueKind(Value value) { appendPDLValueKind(value.getType()); } /// Append the PDLValue::Kind of the given type. void appendPDLValueKind(Type type) { PDLValue::Kind kind = TypeSwitch(type) .Case( [](Type) { return PDLValue::Kind::Attribute; }) .Case( [](Type) { return PDLValue::Kind::Operation; }) .Case([](pdl::RangeType rangeTy) { if (rangeTy.getElementType().isa()) return PDLValue::Kind::TypeRange; return PDLValue::Kind::ValueRange; }) .Case([](Type) { return PDLValue::Kind::Type; }) .Case([](Type) { return PDLValue::Kind::Value; }); bytecode.push_back(static_cast(kind)); } /// Append a value that will be stored in a memory slot and not inline within /// the bytecode. template std::enable_if_t::value || std::is_pointer::value> append(T value) { bytecode.push_back(generator.getMemIndex(value)); } /// Append a range of values. template > std::enable_if_t::value> append(T range) { bytecode.push_back(llvm::size(range)); for (auto it : range) append(it); } /// Append a variadic number of fields to the bytecode. template void append(FieldTy field, Field2Ty field2, FieldTys... fields) { append(field); append(field2, fields...); } /// Appends a value as a pointer, stored inline within the bytecode. template std::enable_if_t::value> appendInline(T value) { constexpr size_t numParts = sizeof(const void *) / sizeof(ByteCodeField); const void *pointer = value.getAsOpaquePointer(); ByteCodeField fieldParts[numParts]; std::memcpy(fieldParts, &pointer, sizeof(const void *)); bytecode.append(fieldParts, fieldParts + numParts); } /// Successor references in the bytecode that have yet to be resolved. DenseMap> unresolvedSuccessorRefs; /// The underlying bytecode buffer. SmallVectorImpl &bytecode; /// The main generator producing PDL. Generator &generator; }; /// This class represents a live range of PDL Interpreter values, containing /// information about when values are live within a match/rewrite. struct ByteCodeLiveRange { using Set = llvm::IntervalMap; using Allocator = Set::Allocator; ByteCodeLiveRange(Allocator &alloc) : liveness(new Set(alloc)) {} /// Union this live range with the one provided. void unionWith(const ByteCodeLiveRange &rhs) { for (auto it = rhs.liveness->begin(), e = rhs.liveness->end(); it != e; ++it) liveness->insert(it.start(), it.stop(), /*dummyValue*/ 0); } /// Returns true if this range overlaps with the one provided. bool overlaps(const ByteCodeLiveRange &rhs) const { return llvm::IntervalMapOverlaps(*liveness, *rhs.liveness) .valid(); } /// A map representing the ranges of the match/rewrite that a value is live in /// the interpreter. /// /// We use std::unique_ptr here, because IntervalMap does not provide a /// correct copy or move constructor. We can eliminate the pointer once /// https://reviews.llvm.org/D113240 lands. std::unique_ptr> liveness; /// The operation range storage index for this range. Optional opRangeIndex; /// The type range storage index for this range. Optional typeRangeIndex; /// The value range storage index for this range. Optional valueRangeIndex; }; } // namespace void Generator::generate(ModuleOp module) { FuncOp matcherFunc = module.lookupSymbol( pdl_interp::PDLInterpDialect::getMatcherFunctionName()); ModuleOp rewriterModule = module.lookupSymbol( pdl_interp::PDLInterpDialect::getRewriterModuleName()); assert(matcherFunc && rewriterModule && "invalid PDL Interpreter module"); // Allocate memory indices for the results of operations within the matcher // and rewriters. allocateMemoryIndices(matcherFunc, rewriterModule); // Generate code for the rewriter functions. ByteCodeWriter rewriterByteCodeWriter(rewriterByteCode, *this); for (FuncOp rewriterFunc : rewriterModule.getOps()) { rewriterToAddr.try_emplace(rewriterFunc.getName(), rewriterByteCode.size()); for (Operation &op : rewriterFunc.getOps()) generate(&op, rewriterByteCodeWriter); } assert(rewriterByteCodeWriter.unresolvedSuccessorRefs.empty() && "unexpected branches in rewriter function"); // Generate code for the matcher function. ByteCodeWriter matcherByteCodeWriter(matcherByteCode, *this); generate(&matcherFunc.getBody(), matcherByteCodeWriter); // Resolve successor references in the matcher. for (auto &it : matcherByteCodeWriter.unresolvedSuccessorRefs) { ByteCodeAddr addr = blockToAddr[it.first]; for (unsigned offsetToFix : it.second) std::memcpy(&matcherByteCode[offsetToFix], &addr, sizeof(ByteCodeAddr)); } } void Generator::allocateMemoryIndices(FuncOp matcherFunc, ModuleOp rewriterModule) { // Rewriters use simplistic allocation scheme that simply assigns an index to // each result. for (FuncOp rewriterFunc : rewriterModule.getOps()) { ByteCodeField index = 0, typeRangeIndex = 0, valueRangeIndex = 0; auto processRewriterValue = [&](Value val) { valueToMemIndex.try_emplace(val, index++); if (pdl::RangeType rangeType = val.getType().dyn_cast()) { Type elementTy = rangeType.getElementType(); if (elementTy.isa()) valueToRangeIndex.try_emplace(val, typeRangeIndex++); else if (elementTy.isa()) valueToRangeIndex.try_emplace(val, valueRangeIndex++); } }; for (BlockArgument arg : rewriterFunc.getArguments()) processRewriterValue(arg); rewriterFunc.getBody().walk([&](Operation *op) { for (Value result : op->getResults()) processRewriterValue(result); }); if (index > maxValueMemoryIndex) maxValueMemoryIndex = index; if (typeRangeIndex > maxTypeRangeMemoryIndex) maxTypeRangeMemoryIndex = typeRangeIndex; if (valueRangeIndex > maxValueRangeMemoryIndex) maxValueRangeMemoryIndex = valueRangeIndex; } // The matcher function uses a more sophisticated numbering that tries to // minimize the number of memory indices assigned. This is done by determining // a live range of the values within the matcher, then the allocation is just // finding the minimal number of overlapping live ranges. This is essentially // a simplified form of register allocation where we don't necessarily have a // limited number of registers, but we still want to minimize the number used. DenseMap opToIndex; matcherFunc.getBody().walk([&](Operation *op) { opToIndex.insert(std::make_pair(op, opToIndex.size())); }); // Liveness info for each of the defs within the matcher. ByteCodeLiveRange::Allocator allocator; DenseMap valueDefRanges; // Assign the root operation being matched to slot 0. BlockArgument rootOpArg = matcherFunc.getArgument(0); valueToMemIndex[rootOpArg] = 0; // Walk each of the blocks, computing the def interval that the value is used. Liveness matcherLiveness(matcherFunc); matcherFunc->walk([&](Block *block) { const LivenessBlockInfo *info = matcherLiveness.getLiveness(block); assert(info && "expected liveness info for block"); auto processValue = [&](Value value, Operation *firstUseOrDef) { // We don't need to process the root op argument, this value is always // assigned to the first memory slot. if (value == rootOpArg) return; // Set indices for the range of this block that the value is used. auto defRangeIt = valueDefRanges.try_emplace(value, allocator).first; defRangeIt->second.liveness->insert( opToIndex[firstUseOrDef], opToIndex[info->getEndOperation(value, firstUseOrDef)], /*dummyValue*/ 0); // Check to see if this value is a range type. if (auto rangeTy = value.getType().dyn_cast()) { Type eleType = rangeTy.getElementType(); if (eleType.isa()) defRangeIt->second.opRangeIndex = 0; else if (eleType.isa()) defRangeIt->second.typeRangeIndex = 0; else if (eleType.isa()) defRangeIt->second.valueRangeIndex = 0; } }; // Process the live-ins of this block. for (Value liveIn : info->in()) { // Only process the value if it has been defined in the current region. // Other values that span across pdl_interp.foreach will be added higher // up. This ensures that the we keep them alive for the entire duration // of the loop. if (liveIn.getParentRegion() == block->getParent()) processValue(liveIn, &block->front()); } // Process the block arguments for the entry block (those are not live-in). if (block->isEntryBlock()) { for (Value argument : block->getArguments()) processValue(argument, &block->front()); } // Process any new defs within this block. for (Operation &op : *block) for (Value result : op.getResults()) processValue(result, &op); }); // Greedily allocate memory slots using the computed def live ranges. std::vector allocatedIndices; // The number of memory indices currently allocated (and its next value). // Recall that the root gets allocated memory index 0. ByteCodeField numIndices = 1; // The number of memory ranges of various types (and their next values). ByteCodeField numOpRanges = 0, numTypeRanges = 0, numValueRanges = 0; for (auto &defIt : valueDefRanges) { ByteCodeField &memIndex = valueToMemIndex[defIt.first]; ByteCodeLiveRange &defRange = defIt.second; // Try to allocate to an existing index. for (auto existingIndexIt : llvm::enumerate(allocatedIndices)) { ByteCodeLiveRange &existingRange = existingIndexIt.value(); if (!defRange.overlaps(existingRange)) { existingRange.unionWith(defRange); memIndex = existingIndexIt.index() + 1; if (defRange.opRangeIndex) { if (!existingRange.opRangeIndex) existingRange.opRangeIndex = numOpRanges++; valueToRangeIndex[defIt.first] = *existingRange.opRangeIndex; } else if (defRange.typeRangeIndex) { if (!existingRange.typeRangeIndex) existingRange.typeRangeIndex = numTypeRanges++; valueToRangeIndex[defIt.first] = *existingRange.typeRangeIndex; } else if (defRange.valueRangeIndex) { if (!existingRange.valueRangeIndex) existingRange.valueRangeIndex = numValueRanges++; valueToRangeIndex[defIt.first] = *existingRange.valueRangeIndex; } break; } } // If no existing index could be used, add a new one. if (memIndex == 0) { allocatedIndices.emplace_back(allocator); ByteCodeLiveRange &newRange = allocatedIndices.back(); newRange.unionWith(defRange); // Allocate an index for op/type/value ranges. if (defRange.opRangeIndex) { newRange.opRangeIndex = numOpRanges; valueToRangeIndex[defIt.first] = numOpRanges++; } else if (defRange.typeRangeIndex) { newRange.typeRangeIndex = numTypeRanges; valueToRangeIndex[defIt.first] = numTypeRanges++; } else if (defRange.valueRangeIndex) { newRange.valueRangeIndex = numValueRanges; valueToRangeIndex[defIt.first] = numValueRanges++; } memIndex = allocatedIndices.size(); ++numIndices; } } // Print the index usage and ensure that we did not run out of index space. LLVM_DEBUG({ llvm::dbgs() << "Allocated " << allocatedIndices.size() << " indices " << "(down from initial " << valueDefRanges.size() << ").\n"; }); assert(allocatedIndices.size() <= std::numeric_limits::max() && "Ran out of memory for allocated indices"); // Update the max number of indices. if (numIndices > maxValueMemoryIndex) maxValueMemoryIndex = numIndices; if (numOpRanges > maxOpRangeMemoryIndex) maxOpRangeMemoryIndex = numOpRanges; if (numTypeRanges > maxTypeRangeMemoryIndex) maxTypeRangeMemoryIndex = numTypeRanges; if (numValueRanges > maxValueRangeMemoryIndex) maxValueRangeMemoryIndex = numValueRanges; } void Generator::generate(Region *region, ByteCodeWriter &writer) { llvm::ReversePostOrderTraversal rpot(region); for (Block *block : rpot) { // Keep track of where this block begins within the matcher function. blockToAddr.try_emplace(block, matcherByteCode.size()); for (Operation &op : *block) generate(&op, writer); } } void Generator::generate(Operation *op, ByteCodeWriter &writer) { LLVM_DEBUG({ // The following list must contain all the operations that do not // produce any bytecode. if (!isa(op)) writer.appendInline(op->getLoc()); }); TypeSwitch(op) .Case( [&](auto interpOp) { this->generate(interpOp, writer); }) .Default([](Operation *) { llvm_unreachable("unknown `pdl_interp` operation"); }); } void Generator::generate(pdl_interp::ApplyConstraintOp op, ByteCodeWriter &writer) { assert(constraintToMemIndex.count(op.name()) && "expected index for constraint function"); writer.append(OpCode::ApplyConstraint, constraintToMemIndex[op.name()], op.constParamsAttr()); writer.appendPDLValueList(op.args()); writer.append(op.getSuccessors()); } void Generator::generate(pdl_interp::ApplyRewriteOp op, ByteCodeWriter &writer) { assert(externalRewriterToMemIndex.count(op.name()) && "expected index for rewrite function"); writer.append(OpCode::ApplyRewrite, externalRewriterToMemIndex[op.name()], op.constParamsAttr()); writer.appendPDLValueList(op.args()); ResultRange results = op.results(); writer.append(ByteCodeField(results.size())); for (Value result : results) { // In debug mode we also record the expected kind of the result, so that we // can provide extra verification of the native rewrite function. #ifndef NDEBUG writer.appendPDLValueKind(result); #endif // Range results also need to append the range storage index. if (result.getType().isa()) writer.append(getRangeStorageIndex(result)); writer.append(result); } } void Generator::generate(pdl_interp::AreEqualOp op, ByteCodeWriter &writer) { Value lhs = op.lhs(); if (lhs.getType().isa()) { writer.append(OpCode::AreRangesEqual); writer.appendPDLValueKind(lhs); writer.append(op.lhs(), op.rhs(), op.getSuccessors()); return; } writer.append(OpCode::AreEqual, lhs, op.rhs(), op.getSuccessors()); } void Generator::generate(pdl_interp::BranchOp op, ByteCodeWriter &writer) { writer.append(OpCode::Branch, SuccessorRange(op.getOperation())); } void Generator::generate(pdl_interp::CheckAttributeOp op, ByteCodeWriter &writer) { writer.append(OpCode::AreEqual, op.attribute(), op.constantValue(), op.getSuccessors()); } void Generator::generate(pdl_interp::CheckOperandCountOp op, ByteCodeWriter &writer) { writer.append(OpCode::CheckOperandCount, op.operation(), op.count(), static_cast(op.compareAtLeast()), op.getSuccessors()); } void Generator::generate(pdl_interp::CheckOperationNameOp op, ByteCodeWriter &writer) { writer.append(OpCode::CheckOperationName, op.operation(), OperationName(op.name(), ctx), op.getSuccessors()); } void Generator::generate(pdl_interp::CheckResultCountOp op, ByteCodeWriter &writer) { writer.append(OpCode::CheckResultCount, op.operation(), op.count(), static_cast(op.compareAtLeast()), op.getSuccessors()); } void Generator::generate(pdl_interp::CheckTypeOp op, ByteCodeWriter &writer) { writer.append(OpCode::AreEqual, op.value(), op.type(), op.getSuccessors()); } void Generator::generate(pdl_interp::CheckTypesOp op, ByteCodeWriter &writer) { writer.append(OpCode::CheckTypes, op.value(), op.types(), op.getSuccessors()); } void Generator::generate(pdl_interp::ContinueOp op, ByteCodeWriter &writer) { assert(curLoopLevel > 0 && "encountered pdl_interp.continue at top level"); writer.append(OpCode::Continue, ByteCodeField(curLoopLevel - 1)); } void Generator::generate(pdl_interp::CreateAttributeOp op, ByteCodeWriter &writer) { // Simply repoint the memory index of the result to the constant. getMemIndex(op.attribute()) = getMemIndex(op.value()); } void Generator::generate(pdl_interp::CreateOperationOp op, ByteCodeWriter &writer) { writer.append(OpCode::CreateOperation, op.operation(), OperationName(op.name(), ctx)); writer.appendPDLValueList(op.operands()); // Add the attributes. OperandRange attributes = op.attributes(); writer.append(static_cast(attributes.size())); for (auto it : llvm::zip(op.attributeNames(), op.attributes())) writer.append(std::get<0>(it), std::get<1>(it)); writer.appendPDLValueList(op.types()); } void Generator::generate(pdl_interp::CreateTypeOp op, ByteCodeWriter &writer) { // Simply repoint the memory index of the result to the constant. getMemIndex(op.result()) = getMemIndex(op.value()); } void Generator::generate(pdl_interp::CreateTypesOp op, ByteCodeWriter &writer) { writer.append(OpCode::CreateTypes, op.result(), getRangeStorageIndex(op.result()), op.value()); } void Generator::generate(pdl_interp::EraseOp op, ByteCodeWriter &writer) { writer.append(OpCode::EraseOp, op.operation()); } void Generator::generate(pdl_interp::ExtractOp op, ByteCodeWriter &writer) { OpCode opCode = TypeSwitch(op.result().getType()) .Case([](pdl::OperationType) { return OpCode::ExtractOp; }) .Case([](pdl::ValueType) { return OpCode::ExtractValue; }) .Case([](pdl::TypeType) { return OpCode::ExtractType; }) .Default([](Type) -> OpCode { llvm_unreachable("unsupported element type"); }); writer.append(opCode, op.range(), op.index(), op.result()); } void Generator::generate(pdl_interp::FinalizeOp op, ByteCodeWriter &writer) { writer.append(OpCode::Finalize); } void Generator::generate(pdl_interp::ForEachOp op, ByteCodeWriter &writer) { BlockArgument arg = op.getLoopVariable(); writer.append(OpCode::ForEach, getRangeStorageIndex(op.values()), arg); writer.appendPDLValueKind(arg.getType()); writer.append(curLoopLevel, op.successor()); ++curLoopLevel; if (curLoopLevel > maxLoopLevel) maxLoopLevel = curLoopLevel; generate(&op.region(), writer); --curLoopLevel; } void Generator::generate(pdl_interp::GetAttributeOp op, ByteCodeWriter &writer) { writer.append(OpCode::GetAttribute, op.attribute(), op.operation(), op.nameAttr()); } void Generator::generate(pdl_interp::GetAttributeTypeOp op, ByteCodeWriter &writer) { writer.append(OpCode::GetAttributeType, op.result(), op.value()); } void Generator::generate(pdl_interp::GetDefiningOpOp op, ByteCodeWriter &writer) { writer.append(OpCode::GetDefiningOp, op.operation()); writer.appendPDLValue(op.value()); } void Generator::generate(pdl_interp::GetOperandOp op, ByteCodeWriter &writer) { uint32_t index = op.index(); if (index < 4) writer.append(static_cast(OpCode::GetOperand0 + index)); else writer.append(OpCode::GetOperandN, index); writer.append(op.operation(), op.value()); } void Generator::generate(pdl_interp::GetOperandsOp op, ByteCodeWriter &writer) { Value result = op.value(); Optional index = op.index(); writer.append(OpCode::GetOperands, index.getValueOr(std::numeric_limits::max()), op.operation()); if (result.getType().isa()) writer.append(getRangeStorageIndex(result)); else writer.append(std::numeric_limits::max()); writer.append(result); } void Generator::generate(pdl_interp::GetResultOp op, ByteCodeWriter &writer) { uint32_t index = op.index(); if (index < 4) writer.append(static_cast(OpCode::GetResult0 + index)); else writer.append(OpCode::GetResultN, index); writer.append(op.operation(), op.value()); } void Generator::generate(pdl_interp::GetResultsOp op, ByteCodeWriter &writer) { Value result = op.value(); Optional index = op.index(); writer.append(OpCode::GetResults, index.getValueOr(std::numeric_limits::max()), op.operation()); if (result.getType().isa()) writer.append(getRangeStorageIndex(result)); else writer.append(std::numeric_limits::max()); writer.append(result); } void Generator::generate(pdl_interp::GetUsersOp op, ByteCodeWriter &writer) { Value operations = op.operations(); ByteCodeField rangeIndex = getRangeStorageIndex(operations); writer.append(OpCode::GetUsers, operations, rangeIndex); writer.appendPDLValue(op.value()); } void Generator::generate(pdl_interp::GetValueTypeOp op, ByteCodeWriter &writer) { if (op.getType().isa()) { Value result = op.result(); writer.append(OpCode::GetValueRangeTypes, result, getRangeStorageIndex(result), op.value()); } else { writer.append(OpCode::GetValueType, op.result(), op.value()); } } void Generator::generate(pdl_interp::InferredTypesOp op, ByteCodeWriter &writer) { // InferType maps to a null type as a marker for inferring result types. getMemIndex(op.type()) = getMemIndex(Type()); } void Generator::generate(pdl_interp::IsNotNullOp op, ByteCodeWriter &writer) { writer.append(OpCode::IsNotNull, op.value(), op.getSuccessors()); } void Generator::generate(pdl_interp::RecordMatchOp op, ByteCodeWriter &writer) { ByteCodeField patternIndex = patterns.size(); patterns.emplace_back(PDLByteCodePattern::create( op, rewriterToAddr[op.rewriter().getLeafReference().getValue()])); writer.append(OpCode::RecordMatch, patternIndex, SuccessorRange(op.getOperation()), op.matchedOps()); writer.appendPDLValueList(op.inputs()); } void Generator::generate(pdl_interp::ReplaceOp op, ByteCodeWriter &writer) { writer.append(OpCode::ReplaceOp, op.operation()); writer.appendPDLValueList(op.replValues()); } void Generator::generate(pdl_interp::SwitchAttributeOp op, ByteCodeWriter &writer) { writer.append(OpCode::SwitchAttribute, op.attribute(), op.caseValuesAttr(), op.getSuccessors()); } void Generator::generate(pdl_interp::SwitchOperandCountOp op, ByteCodeWriter &writer) { writer.append(OpCode::SwitchOperandCount, op.operation(), op.caseValuesAttr(), op.getSuccessors()); } void Generator::generate(pdl_interp::SwitchOperationNameOp op, ByteCodeWriter &writer) { auto cases = llvm::map_range(op.caseValuesAttr(), [&](Attribute attr) { return OperationName(attr.cast().getValue(), ctx); }); writer.append(OpCode::SwitchOperationName, op.operation(), cases, op.getSuccessors()); } void Generator::generate(pdl_interp::SwitchResultCountOp op, ByteCodeWriter &writer) { writer.append(OpCode::SwitchResultCount, op.operation(), op.caseValuesAttr(), op.getSuccessors()); } void Generator::generate(pdl_interp::SwitchTypeOp op, ByteCodeWriter &writer) { writer.append(OpCode::SwitchType, op.value(), op.caseValuesAttr(), op.getSuccessors()); } void Generator::generate(pdl_interp::SwitchTypesOp op, ByteCodeWriter &writer) { writer.append(OpCode::SwitchTypes, op.value(), op.caseValuesAttr(), op.getSuccessors()); } //===----------------------------------------------------------------------===// // PDLByteCode //===----------------------------------------------------------------------===// PDLByteCode::PDLByteCode(ModuleOp module, llvm::StringMap constraintFns, llvm::StringMap rewriteFns) { Generator generator(module.getContext(), uniquedData, matcherByteCode, rewriterByteCode, patterns, maxValueMemoryIndex, maxOpRangeCount, maxTypeRangeCount, maxValueRangeCount, maxLoopLevel, constraintFns, rewriteFns); generator.generate(module); // Initialize the external functions. for (auto &it : constraintFns) constraintFunctions.push_back(std::move(it.second)); for (auto &it : rewriteFns) rewriteFunctions.push_back(std::move(it.second)); } /// Initialize the given state such that it can be used to execute the current /// bytecode. void PDLByteCode::initializeMutableState(PDLByteCodeMutableState &state) const { state.memory.resize(maxValueMemoryIndex, nullptr); state.opRangeMemory.resize(maxOpRangeCount); state.typeRangeMemory.resize(maxTypeRangeCount, TypeRange()); state.valueRangeMemory.resize(maxValueRangeCount, ValueRange()); state.loopIndex.resize(maxLoopLevel, 0); state.currentPatternBenefits.reserve(patterns.size()); for (const PDLByteCodePattern &pattern : patterns) state.currentPatternBenefits.push_back(pattern.getBenefit()); } //===----------------------------------------------------------------------===// // ByteCode Execution namespace { /// This class provides support for executing a bytecode stream. class ByteCodeExecutor { public: ByteCodeExecutor( const ByteCodeField *curCodeIt, MutableArrayRef memory, MutableArrayRef> opRangeMemory, MutableArrayRef typeRangeMemory, std::vector> &allocatedTypeRangeMemory, MutableArrayRef valueRangeMemory, std::vector> &allocatedValueRangeMemory, MutableArrayRef loopIndex, ArrayRef uniquedMemory, ArrayRef code, ArrayRef currentPatternBenefits, ArrayRef patterns, ArrayRef constraintFunctions, ArrayRef rewriteFunctions) : curCodeIt(curCodeIt), memory(memory), opRangeMemory(opRangeMemory), typeRangeMemory(typeRangeMemory), allocatedTypeRangeMemory(allocatedTypeRangeMemory), valueRangeMemory(valueRangeMemory), allocatedValueRangeMemory(allocatedValueRangeMemory), loopIndex(loopIndex), uniquedMemory(uniquedMemory), code(code), currentPatternBenefits(currentPatternBenefits), patterns(patterns), constraintFunctions(constraintFunctions), rewriteFunctions(rewriteFunctions) {} /// Start executing the code at the current bytecode index. `matches` is an /// optional field provided when this function is executed in a matching /// context. void execute(PatternRewriter &rewriter, SmallVectorImpl *matches = nullptr, Optional mainRewriteLoc = {}); private: /// Internal implementation of executing each of the bytecode commands. void executeApplyConstraint(PatternRewriter &rewriter); void executeApplyRewrite(PatternRewriter &rewriter); void executeAreEqual(); void executeAreRangesEqual(); void executeBranch(); void executeCheckOperandCount(); void executeCheckOperationName(); void executeCheckResultCount(); void executeCheckTypes(); void executeContinue(); void executeCreateOperation(PatternRewriter &rewriter, Location mainRewriteLoc); void executeCreateTypes(); void executeEraseOp(PatternRewriter &rewriter); template void executeExtract(); void executeFinalize(); void executeForEach(); void executeGetAttribute(); void executeGetAttributeType(); void executeGetDefiningOp(); void executeGetOperand(unsigned index); void executeGetOperands(); void executeGetResult(unsigned index); void executeGetResults(); void executeGetUsers(); void executeGetValueType(); void executeGetValueRangeTypes(); void executeIsNotNull(); void executeRecordMatch(PatternRewriter &rewriter, SmallVectorImpl &matches); void executeReplaceOp(PatternRewriter &rewriter); void executeSwitchAttribute(); void executeSwitchOperandCount(); void executeSwitchOperationName(); void executeSwitchResultCount(); void executeSwitchType(); void executeSwitchTypes(); /// Pushes a code iterator to the stack. void pushCodeIt(const ByteCodeField *it) { resumeCodeIt.push_back(it); } /// Pops a code iterator from the stack, returning true on success. void popCodeIt() { assert(!resumeCodeIt.empty() && "attempt to pop code off empty stack"); curCodeIt = resumeCodeIt.back(); resumeCodeIt.pop_back(); } /// Return the bytecode iterator at the start of the current op code. const ByteCodeField *getPrevCodeIt() const { LLVM_DEBUG({ // Account for the op code and the Location stored inline. return curCodeIt - 1 - sizeof(const void *) / sizeof(ByteCodeField); }); // Account for the op code only. return curCodeIt - 1; } /// Read a value from the bytecode buffer, optionally skipping a certain /// number of prefix values. These methods always update the buffer to point /// to the next field after the read data. template T read(size_t skipN = 0) { curCodeIt += skipN; return readImpl(); } ByteCodeField read(size_t skipN = 0) { return read(skipN); } /// Read a list of values from the bytecode buffer. template void readList(SmallVectorImpl &list) { list.clear(); for (unsigned i = 0, e = read(); i != e; ++i) list.push_back(read()); } /// Read a list of values from the bytecode buffer. The values may be encoded /// as either Value or ValueRange elements. void readValueList(SmallVectorImpl &list) { for (unsigned i = 0, e = read(); i != e; ++i) { if (read() == PDLValue::Kind::Value) { list.push_back(read()); } else { ValueRange *values = read(); list.append(values->begin(), values->end()); } } } /// Read a value stored inline as a pointer. template std::enable_if_t::value, T> readInline() { const void *pointer; std::memcpy(&pointer, curCodeIt, sizeof(const void *)); curCodeIt += sizeof(const void *) / sizeof(ByteCodeField); return T::getFromOpaquePointer(pointer); } /// Jump to a specific successor based on a predicate value. void selectJump(bool isTrue) { selectJump(size_t(isTrue ? 0 : 1)); } /// Jump to a specific successor based on a destination index. void selectJump(size_t destIndex) { curCodeIt = &code[read(destIndex * 2)]; } /// Handle a switch operation with the provided value and cases. template > void handleSwitch(const T &value, RangeT &&cases, Comparator cmp = {}) { LLVM_DEBUG({ llvm::dbgs() << " * Value: " << value << "\n" << " * Cases: "; llvm::interleaveComma(cases, llvm::dbgs()); llvm::dbgs() << "\n"; }); // Check to see if the attribute value is within the case list. Jump to // the correct successor index based on the result. for (auto it = cases.begin(), e = cases.end(); it != e; ++it) if (cmp(*it, value)) return selectJump(size_t((it - cases.begin()) + 1)); selectJump(size_t(0)); } /// Store a pointer to memory. void storeToMemory(unsigned index, const void *value) { memory[index] = value; } /// Store a value to memory as an opaque pointer. template std::enable_if_t::value> storeToMemory(unsigned index, T value) { memory[index] = value.getAsOpaquePointer(); } /// Internal implementation of reading various data types from the bytecode /// stream. template const void *readFromMemory() { size_t index = *curCodeIt++; // If this type is an SSA value, it can only be stored in non-const memory. if (llvm::is_one_of::value || index < memory.size()) return memory[index]; // Otherwise, if this index is not inbounds it is uniqued. return uniquedMemory[index - memory.size()]; } template std::enable_if_t::value, T> readImpl() { return reinterpret_cast(const_cast(readFromMemory())); } template std::enable_if_t::value && !std::is_same::value, T> readImpl() { return T(T::getFromOpaquePointer(readFromMemory())); } template std::enable_if_t::value, T> readImpl() { switch (read()) { case PDLValue::Kind::Attribute: return read(); case PDLValue::Kind::Operation: return read(); case PDLValue::Kind::Type: return read(); case PDLValue::Kind::Value: return read(); case PDLValue::Kind::TypeRange: return read(); case PDLValue::Kind::ValueRange: return read(); } llvm_unreachable("unhandled PDLValue::Kind"); } template std::enable_if_t::value, T> readImpl() { static_assert((sizeof(ByteCodeAddr) / sizeof(ByteCodeField)) == 2, "unexpected ByteCode address size"); ByteCodeAddr result; std::memcpy(&result, curCodeIt, sizeof(ByteCodeAddr)); curCodeIt += 2; return result; } template std::enable_if_t::value, T> readImpl() { return *curCodeIt++; } template std::enable_if_t::value, T> readImpl() { return static_cast(readImpl()); } /// The underlying bytecode buffer. const ByteCodeField *curCodeIt; /// The stack of bytecode positions at which to resume operation. SmallVector resumeCodeIt; /// The current execution memory. MutableArrayRef memory; MutableArrayRef opRangeMemory; MutableArrayRef typeRangeMemory; std::vector> &allocatedTypeRangeMemory; MutableArrayRef valueRangeMemory; std::vector> &allocatedValueRangeMemory; /// The current loop indices. MutableArrayRef loopIndex; /// References to ByteCode data necessary for execution. ArrayRef uniquedMemory; ArrayRef code; ArrayRef currentPatternBenefits; ArrayRef patterns; ArrayRef constraintFunctions; ArrayRef rewriteFunctions; }; /// This class is an instantiation of the PDLResultList that provides access to /// the returned results. This API is not on `PDLResultList` to avoid /// overexposing access to information specific solely to the ByteCode. class ByteCodeRewriteResultList : public PDLResultList { public: ByteCodeRewriteResultList(unsigned maxNumResults) : PDLResultList(maxNumResults) {} /// Return the list of PDL results. MutableArrayRef getResults() { return results; } /// Return the type ranges allocated by this list. MutableArrayRef> getAllocatedTypeRanges() { return allocatedTypeRanges; } /// Return the value ranges allocated by this list. MutableArrayRef> getAllocatedValueRanges() { return allocatedValueRanges; } }; } // namespace void ByteCodeExecutor::executeApplyConstraint(PatternRewriter &rewriter) { LLVM_DEBUG(llvm::dbgs() << "Executing ApplyConstraint:\n"); const PDLConstraintFunction &constraintFn = constraintFunctions[read()]; ArrayAttr constParams = read(); SmallVector args; readList(args); LLVM_DEBUG({ llvm::dbgs() << " * Arguments: "; llvm::interleaveComma(args, llvm::dbgs()); llvm::dbgs() << "\n * Parameters: " << constParams << "\n"; }); // Invoke the constraint and jump to the proper destination. selectJump(succeeded(constraintFn(args, constParams, rewriter))); } void ByteCodeExecutor::executeApplyRewrite(PatternRewriter &rewriter) { LLVM_DEBUG(llvm::dbgs() << "Executing ApplyRewrite:\n"); const PDLRewriteFunction &rewriteFn = rewriteFunctions[read()]; ArrayAttr constParams = read(); SmallVector args; readList(args); LLVM_DEBUG({ llvm::dbgs() << " * Arguments: "; llvm::interleaveComma(args, llvm::dbgs()); llvm::dbgs() << "\n * Parameters: " << constParams << "\n"; }); // Execute the rewrite function. ByteCodeField numResults = read(); ByteCodeRewriteResultList results(numResults); rewriteFn(args, constParams, rewriter, results); assert(results.getResults().size() == numResults && "native PDL rewrite function returned unexpected number of results"); // Store the results in the bytecode memory. for (PDLValue &result : results.getResults()) { LLVM_DEBUG(llvm::dbgs() << " * Result: " << result << "\n"); // In debug mode we also verify the expected kind of the result. #ifndef NDEBUG assert(result.getKind() == read() && "native PDL rewrite function returned an unexpected type of result"); #endif // If the result is a range, we need to copy it over to the bytecodes // range memory. if (Optional typeRange = result.dyn_cast()) { unsigned rangeIndex = read(); typeRangeMemory[rangeIndex] = *typeRange; memory[read()] = &typeRangeMemory[rangeIndex]; } else if (Optional valueRange = result.dyn_cast()) { unsigned rangeIndex = read(); valueRangeMemory[rangeIndex] = *valueRange; memory[read()] = &valueRangeMemory[rangeIndex]; } else { memory[read()] = result.getAsOpaquePointer(); } } // Copy over any underlying storage allocated for result ranges. for (auto &it : results.getAllocatedTypeRanges()) allocatedTypeRangeMemory.push_back(std::move(it)); for (auto &it : results.getAllocatedValueRanges()) allocatedValueRangeMemory.push_back(std::move(it)); } void ByteCodeExecutor::executeAreEqual() { LLVM_DEBUG(llvm::dbgs() << "Executing AreEqual:\n"); const void *lhs = read(); const void *rhs = read(); LLVM_DEBUG(llvm::dbgs() << " * " << lhs << " == " << rhs << "\n"); selectJump(lhs == rhs); } void ByteCodeExecutor::executeAreRangesEqual() { LLVM_DEBUG(llvm::dbgs() << "Executing AreRangesEqual:\n"); PDLValue::Kind valueKind = read(); const void *lhs = read(); const void *rhs = read(); switch (valueKind) { case PDLValue::Kind::TypeRange: { const TypeRange *lhsRange = reinterpret_cast(lhs); const TypeRange *rhsRange = reinterpret_cast(rhs); LLVM_DEBUG(llvm::dbgs() << " * " << lhs << " == " << rhs << "\n\n"); selectJump(*lhsRange == *rhsRange); break; } case PDLValue::Kind::ValueRange: { const auto *lhsRange = reinterpret_cast(lhs); const auto *rhsRange = reinterpret_cast(rhs); LLVM_DEBUG(llvm::dbgs() << " * " << lhs << " == " << rhs << "\n\n"); selectJump(*lhsRange == *rhsRange); break; } default: llvm_unreachable("unexpected `AreRangesEqual` value kind"); } } void ByteCodeExecutor::executeBranch() { LLVM_DEBUG(llvm::dbgs() << "Executing Branch\n"); curCodeIt = &code[read()]; } void ByteCodeExecutor::executeCheckOperandCount() { LLVM_DEBUG(llvm::dbgs() << "Executing CheckOperandCount:\n"); Operation *op = read(); uint32_t expectedCount = read(); bool compareAtLeast = read(); LLVM_DEBUG(llvm::dbgs() << " * Found: " << op->getNumOperands() << "\n" << " * Expected: " << expectedCount << "\n" << " * Comparator: " << (compareAtLeast ? ">=" : "==") << "\n"); if (compareAtLeast) selectJump(op->getNumOperands() >= expectedCount); else selectJump(op->getNumOperands() == expectedCount); } void ByteCodeExecutor::executeCheckOperationName() { LLVM_DEBUG(llvm::dbgs() << "Executing CheckOperationName:\n"); Operation *op = read(); OperationName expectedName = read(); LLVM_DEBUG(llvm::dbgs() << " * Found: \"" << op->getName() << "\"\n" << " * Expected: \"" << expectedName << "\"\n"); selectJump(op->getName() == expectedName); } void ByteCodeExecutor::executeCheckResultCount() { LLVM_DEBUG(llvm::dbgs() << "Executing CheckResultCount:\n"); Operation *op = read(); uint32_t expectedCount = read(); bool compareAtLeast = read(); LLVM_DEBUG(llvm::dbgs() << " * Found: " << op->getNumResults() << "\n" << " * Expected: " << expectedCount << "\n" << " * Comparator: " << (compareAtLeast ? ">=" : "==") << "\n"); if (compareAtLeast) selectJump(op->getNumResults() >= expectedCount); else selectJump(op->getNumResults() == expectedCount); } void ByteCodeExecutor::executeCheckTypes() { LLVM_DEBUG(llvm::dbgs() << "Executing AreEqual:\n"); TypeRange *lhs = read(); Attribute rhs = read(); LLVM_DEBUG(llvm::dbgs() << " * " << lhs << " == " << rhs << "\n\n"); selectJump(*lhs == rhs.cast().getAsValueRange()); } void ByteCodeExecutor::executeContinue() { ByteCodeField level = read(); LLVM_DEBUG(llvm::dbgs() << "Executing Continue\n" << " * Level: " << level << "\n"); ++loopIndex[level]; popCodeIt(); } void ByteCodeExecutor::executeCreateTypes() { LLVM_DEBUG(llvm::dbgs() << "Executing CreateTypes:\n"); unsigned memIndex = read(); unsigned rangeIndex = read(); ArrayAttr typesAttr = read().cast(); LLVM_DEBUG(llvm::dbgs() << " * Types: " << typesAttr << "\n\n"); // Allocate a buffer for this type range. llvm::OwningArrayRef storage(typesAttr.size()); llvm::copy(typesAttr.getAsValueRange(), storage.begin()); allocatedTypeRangeMemory.emplace_back(std::move(storage)); // Assign this to the range slot and use the range as the value for the // memory index. typeRangeMemory[rangeIndex] = allocatedTypeRangeMemory.back(); memory[memIndex] = &typeRangeMemory[rangeIndex]; } void ByteCodeExecutor::executeCreateOperation(PatternRewriter &rewriter, Location mainRewriteLoc) { LLVM_DEBUG(llvm::dbgs() << "Executing CreateOperation:\n"); unsigned memIndex = read(); OperationState state(mainRewriteLoc, read()); readValueList(state.operands); for (unsigned i = 0, e = read(); i != e; ++i) { StringAttr name = read(); if (Attribute attr = read()) state.addAttribute(name, attr); } for (unsigned i = 0, e = read(); i != e; ++i) { if (read() == PDLValue::Kind::Type) { state.types.push_back(read()); continue; } // If we find a null range, this signals that the types are infered. if (TypeRange *resultTypes = read()) { state.types.append(resultTypes->begin(), resultTypes->end()); continue; } // Handle the case where the operation has inferred types. InferTypeOpInterface::Concept *concept = state.name.getRegisteredInfo()->getInterface(); // TODO: Handle failure. state.types.clear(); if (failed(concept->inferReturnTypes( state.getContext(), state.location, state.operands, state.attributes.getDictionary(state.getContext()), state.regions, state.types))) return; break; } Operation *resultOp = rewriter.createOperation(state); memory[memIndex] = resultOp; LLVM_DEBUG({ llvm::dbgs() << " * Attributes: " << state.attributes.getDictionary(state.getContext()) << "\n * Operands: "; llvm::interleaveComma(state.operands, llvm::dbgs()); llvm::dbgs() << "\n * Result Types: "; llvm::interleaveComma(state.types, llvm::dbgs()); llvm::dbgs() << "\n * Result: " << *resultOp << "\n"; }); } void ByteCodeExecutor::executeEraseOp(PatternRewriter &rewriter) { LLVM_DEBUG(llvm::dbgs() << "Executing EraseOp:\n"); Operation *op = read(); LLVM_DEBUG(llvm::dbgs() << " * Operation: " << *op << "\n"); rewriter.eraseOp(op); } template void ByteCodeExecutor::executeExtract() { LLVM_DEBUG(llvm::dbgs() << "Executing Extract" << kind << ":\n"); Range *range = read(); unsigned index = read(); unsigned memIndex = read(); if (!range) { memory[memIndex] = nullptr; return; } T result = index < range->size() ? (*range)[index] : T(); LLVM_DEBUG(llvm::dbgs() << " * " << kind << "s(" << range->size() << ")\n" << " * Index: " << index << "\n" << " * Result: " << result << "\n"); storeToMemory(memIndex, result); } void ByteCodeExecutor::executeFinalize() { LLVM_DEBUG(llvm::dbgs() << "Executing Finalize\n"); } void ByteCodeExecutor::executeForEach() { LLVM_DEBUG(llvm::dbgs() << "Executing ForEach:\n"); const ByteCodeField *prevCodeIt = getPrevCodeIt(); unsigned rangeIndex = read(); unsigned memIndex = read(); const void *value = nullptr; switch (read()) { case PDLValue::Kind::Operation: { unsigned &index = loopIndex[read()]; ArrayRef array = opRangeMemory[rangeIndex]; assert(index <= array.size() && "iterated past the end"); if (index < array.size()) { LLVM_DEBUG(llvm::dbgs() << " * Result: " << array[index] << "\n"); value = array[index]; break; } LLVM_DEBUG(llvm::dbgs() << " * Done\n"); index = 0; selectJump(size_t(0)); return; } default: llvm_unreachable("unexpected `ForEach` value kind"); } // Store the iterate value and the stack address. memory[memIndex] = value; pushCodeIt(prevCodeIt); // Skip over the successor (we will enter the body of the loop). read(); } void ByteCodeExecutor::executeGetAttribute() { LLVM_DEBUG(llvm::dbgs() << "Executing GetAttribute:\n"); unsigned memIndex = read(); Operation *op = read(); StringAttr attrName = read(); Attribute attr = op->getAttr(attrName); LLVM_DEBUG(llvm::dbgs() << " * Operation: " << *op << "\n" << " * Attribute: " << attrName << "\n" << " * Result: " << attr << "\n"); memory[memIndex] = attr.getAsOpaquePointer(); } void ByteCodeExecutor::executeGetAttributeType() { LLVM_DEBUG(llvm::dbgs() << "Executing GetAttributeType:\n"); unsigned memIndex = read(); Attribute attr = read(); Type type = attr ? attr.getType() : Type(); LLVM_DEBUG(llvm::dbgs() << " * Attribute: " << attr << "\n" << " * Result: " << type << "\n"); memory[memIndex] = type.getAsOpaquePointer(); } void ByteCodeExecutor::executeGetDefiningOp() { LLVM_DEBUG(llvm::dbgs() << "Executing GetDefiningOp:\n"); unsigned memIndex = read(); Operation *op = nullptr; if (read() == PDLValue::Kind::Value) { Value value = read(); if (value) op = value.getDefiningOp(); LLVM_DEBUG(llvm::dbgs() << " * Value: " << value << "\n"); } else { ValueRange *values = read(); if (values && !values->empty()) { op = values->front().getDefiningOp(); } LLVM_DEBUG(llvm::dbgs() << " * Values: " << values << "\n"); } LLVM_DEBUG(llvm::dbgs() << " * Result: " << op << "\n"); memory[memIndex] = op; } void ByteCodeExecutor::executeGetOperand(unsigned index) { Operation *op = read(); unsigned memIndex = read(); Value operand = index < op->getNumOperands() ? op->getOperand(index) : Value(); LLVM_DEBUG(llvm::dbgs() << " * Operation: " << *op << "\n" << " * Index: " << index << "\n" << " * Result: " << operand << "\n"); memory[memIndex] = operand.getAsOpaquePointer(); } /// This function is the internal implementation of `GetResults` and /// `GetOperands` that provides support for extracting a value range from the /// given operation. template