1 //===- ExecutionEngine.cpp - MLIR Execution engine and utils --------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements the execution engine for MLIR modules based on LLVM Orc 10 // JIT engine. 11 // 12 //===----------------------------------------------------------------------===// 13 #include "mlir/ExecutionEngine/ExecutionEngine.h" 14 #include "mlir/Dialect/LLVMIR/LLVMDialect.h" 15 #include "mlir/IR/BuiltinOps.h" 16 #include "mlir/Support/FileUtilities.h" 17 #include "mlir/Target/LLVMIR/Export.h" 18 19 #include "llvm/ExecutionEngine/JITEventListener.h" 20 #include "llvm/ExecutionEngine/ObjectCache.h" 21 #include "llvm/ExecutionEngine/Orc/CompileUtils.h" 22 #include "llvm/ExecutionEngine/Orc/ExecutionUtils.h" 23 #include "llvm/ExecutionEngine/Orc/IRCompileLayer.h" 24 #include "llvm/ExecutionEngine/Orc/IRTransformLayer.h" 25 #include "llvm/ExecutionEngine/Orc/JITTargetMachineBuilder.h" 26 #include "llvm/ExecutionEngine/Orc/RTDyldObjectLinkingLayer.h" 27 #include "llvm/ExecutionEngine/SectionMemoryManager.h" 28 #include "llvm/IR/IRBuilder.h" 29 #include "llvm/MC/SubtargetFeature.h" 30 #include "llvm/MC/TargetRegistry.h" 31 #include "llvm/Support/Debug.h" 32 #include "llvm/Support/Error.h" 33 #include "llvm/Support/Host.h" 34 #include "llvm/Support/ToolOutputFile.h" 35 36 #define DEBUG_TYPE "execution-engine" 37 38 using namespace mlir; 39 using llvm::dbgs; 40 using llvm::Error; 41 using llvm::errs; 42 using llvm::Expected; 43 using llvm::LLVMContext; 44 using llvm::MemoryBuffer; 45 using llvm::MemoryBufferRef; 46 using llvm::Module; 47 using llvm::SectionMemoryManager; 48 using llvm::StringError; 49 using llvm::Triple; 50 using llvm::orc::DynamicLibrarySearchGenerator; 51 using llvm::orc::ExecutionSession; 52 using llvm::orc::IRCompileLayer; 53 using llvm::orc::JITTargetMachineBuilder; 54 using llvm::orc::MangleAndInterner; 55 using llvm::orc::RTDyldObjectLinkingLayer; 56 using llvm::orc::SymbolMap; 57 using llvm::orc::ThreadSafeModule; 58 using llvm::orc::TMOwningSimpleCompiler; 59 60 /// Wrap a string into an llvm::StringError. 61 static Error makeStringError(const Twine &message) { 62 return llvm::make_error<StringError>(message.str(), 63 llvm::inconvertibleErrorCode()); 64 } 65 66 void SimpleObjectCache::notifyObjectCompiled(const Module *m, 67 MemoryBufferRef objBuffer) { 68 cachedObjects[m->getModuleIdentifier()] = MemoryBuffer::getMemBufferCopy( 69 objBuffer.getBuffer(), objBuffer.getBufferIdentifier()); 70 } 71 72 std::unique_ptr<MemoryBuffer> SimpleObjectCache::getObject(const Module *m) { 73 auto i = cachedObjects.find(m->getModuleIdentifier()); 74 if (i == cachedObjects.end()) { 75 LLVM_DEBUG(dbgs() << "No object for " << m->getModuleIdentifier() 76 << " in cache. Compiling.\n"); 77 return nullptr; 78 } 79 LLVM_DEBUG(dbgs() << "Object for " << m->getModuleIdentifier() 80 << " loaded from cache.\n"); 81 return MemoryBuffer::getMemBuffer(i->second->getMemBufferRef()); 82 } 83 84 void SimpleObjectCache::dumpToObjectFile(StringRef outputFilename) { 85 // Set up the output file. 86 std::string errorMessage; 87 auto file = openOutputFile(outputFilename, &errorMessage); 88 if (!file) { 89 llvm::errs() << errorMessage << "\n"; 90 return; 91 } 92 93 // Dump the object generated for a single module to the output file. 94 assert(cachedObjects.size() == 1 && "Expected only one object entry."); 95 auto &cachedObject = cachedObjects.begin()->second; 96 file->os() << cachedObject->getBuffer(); 97 file->keep(); 98 } 99 100 void ExecutionEngine::dumpToObjectFile(StringRef filename) { 101 cache->dumpToObjectFile(filename); 102 } 103 104 void ExecutionEngine::registerSymbols( 105 llvm::function_ref<SymbolMap(MangleAndInterner)> symbolMap) { 106 auto &mainJitDylib = jit->getMainJITDylib(); 107 cantFail(mainJitDylib.define( 108 absoluteSymbols(symbolMap(llvm::orc::MangleAndInterner( 109 mainJitDylib.getExecutionSession(), jit->getDataLayout()))))); 110 } 111 112 // Setup LLVM target triple from the current machine. 113 bool ExecutionEngine::setupTargetTriple(Module *llvmModule) { 114 // Setup the machine properties from the current architecture. 115 auto targetTriple = llvm::sys::getDefaultTargetTriple(); 116 std::string errorMessage; 117 const auto *target = 118 llvm::TargetRegistry::lookupTarget(targetTriple, errorMessage); 119 if (!target) { 120 errs() << "NO target: " << errorMessage << "\n"; 121 return true; 122 } 123 124 std::string cpu(llvm::sys::getHostCPUName()); 125 llvm::SubtargetFeatures features; 126 llvm::StringMap<bool> hostFeatures; 127 128 if (llvm::sys::getHostCPUFeatures(hostFeatures)) 129 for (auto &f : hostFeatures) 130 features.AddFeature(f.first(), f.second); 131 132 std::unique_ptr<llvm::TargetMachine> machine(target->createTargetMachine( 133 targetTriple, cpu, features.getString(), {}, {})); 134 if (!machine) { 135 errs() << "Unable to create target machine\n"; 136 return true; 137 } 138 llvmModule->setDataLayout(machine->createDataLayout()); 139 llvmModule->setTargetTriple(targetTriple); 140 return false; 141 } 142 143 static std::string makePackedFunctionName(StringRef name) { 144 return "_mlir_" + name.str(); 145 } 146 147 // For each function in the LLVM module, define an interface function that wraps 148 // all the arguments of the original function and all its results into an i8** 149 // pointer to provide a unified invocation interface. 150 static void packFunctionArguments(Module *module) { 151 auto &ctx = module->getContext(); 152 llvm::IRBuilder<> builder(ctx); 153 DenseSet<llvm::Function *> interfaceFunctions; 154 for (auto &func : module->getFunctionList()) { 155 if (func.isDeclaration()) { 156 continue; 157 } 158 if (interfaceFunctions.count(&func)) { 159 continue; 160 } 161 162 // Given a function `foo(<...>)`, define the interface function 163 // `mlir_foo(i8**)`. 164 auto *newType = llvm::FunctionType::get( 165 builder.getVoidTy(), builder.getInt8PtrTy()->getPointerTo(), 166 /*isVarArg=*/false); 167 auto newName = makePackedFunctionName(func.getName()); 168 auto funcCst = module->getOrInsertFunction(newName, newType); 169 llvm::Function *interfaceFunc = cast<llvm::Function>(funcCst.getCallee()); 170 interfaceFunctions.insert(interfaceFunc); 171 172 // Extract the arguments from the type-erased argument list and cast them to 173 // the proper types. 174 auto *bb = llvm::BasicBlock::Create(ctx); 175 bb->insertInto(interfaceFunc); 176 builder.SetInsertPoint(bb); 177 llvm::Value *argList = interfaceFunc->arg_begin(); 178 SmallVector<llvm::Value *, 8> args; 179 args.reserve(llvm::size(func.args())); 180 for (auto &indexedArg : llvm::enumerate(func.args())) { 181 llvm::Value *argIndex = llvm::Constant::getIntegerValue( 182 builder.getInt64Ty(), APInt(64, indexedArg.index())); 183 llvm::Value *argPtrPtr = 184 builder.CreateGEP(builder.getInt8PtrTy(), argList, argIndex); 185 llvm::Value *argPtr = 186 builder.CreateLoad(builder.getInt8PtrTy(), argPtrPtr); 187 llvm::Type *argTy = indexedArg.value().getType(); 188 argPtr = builder.CreateBitCast(argPtr, argTy->getPointerTo()); 189 llvm::Value *arg = builder.CreateLoad(argTy, argPtr); 190 args.push_back(arg); 191 } 192 193 // Call the implementation function with the extracted arguments. 194 llvm::Value *result = builder.CreateCall(&func, args); 195 196 // Assuming the result is one value, potentially of type `void`. 197 if (!result->getType()->isVoidTy()) { 198 llvm::Value *retIndex = llvm::Constant::getIntegerValue( 199 builder.getInt64Ty(), APInt(64, llvm::size(func.args()))); 200 llvm::Value *retPtrPtr = 201 builder.CreateGEP(builder.getInt8PtrTy(), argList, retIndex); 202 llvm::Value *retPtr = 203 builder.CreateLoad(builder.getInt8PtrTy(), retPtrPtr); 204 retPtr = builder.CreateBitCast(retPtr, result->getType()->getPointerTo()); 205 builder.CreateStore(result, retPtr); 206 } 207 208 // The interface function returns void. 209 builder.CreateRetVoid(); 210 } 211 } 212 213 ExecutionEngine::ExecutionEngine(bool enableObjectCache, 214 bool enableGDBNotificationListener, 215 bool enablePerfNotificationListener) 216 : cache(enableObjectCache ? new SimpleObjectCache() : nullptr), 217 gdbListener(enableGDBNotificationListener 218 ? llvm::JITEventListener::createGDBRegistrationListener() 219 : nullptr), 220 perfListener(nullptr) { 221 if (enablePerfNotificationListener) { 222 if (auto *listener = llvm::JITEventListener::createPerfJITEventListener()) 223 perfListener = listener; 224 else if (auto *listener = 225 llvm::JITEventListener::createIntelJITEventListener()) 226 perfListener = listener; 227 } 228 } 229 230 Expected<std::unique_ptr<ExecutionEngine>> ExecutionEngine::create( 231 ModuleOp m, 232 llvm::function_ref<std::unique_ptr<llvm::Module>(ModuleOp, 233 llvm::LLVMContext &)> 234 llvmModuleBuilder, 235 llvm::function_ref<Error(llvm::Module *)> transformer, 236 Optional<llvm::CodeGenOpt::Level> jitCodeGenOptLevel, 237 ArrayRef<StringRef> sharedLibPaths, bool enableObjectCache, 238 bool enableGDBNotificationListener, bool enablePerfNotificationListener) { 239 auto engine = std::make_unique<ExecutionEngine>( 240 enableObjectCache, enableGDBNotificationListener, 241 enablePerfNotificationListener); 242 243 std::unique_ptr<llvm::LLVMContext> ctx(new llvm::LLVMContext); 244 auto llvmModule = llvmModuleBuilder ? llvmModuleBuilder(m, *ctx) 245 : translateModuleToLLVMIR(m, *ctx); 246 if (!llvmModule) 247 return makeStringError("could not convert to LLVM IR"); 248 // FIXME: the triple should be passed to the translation or dialect conversion 249 // instead of this. Currently, the LLVM module created above has no triple 250 // associated with it. 251 setupTargetTriple(llvmModule.get()); 252 packFunctionArguments(llvmModule.get()); 253 254 auto dataLayout = llvmModule->getDataLayout(); 255 256 // Callback to create the object layer with symbol resolution to current 257 // process and dynamically linked libraries. 258 auto objectLinkingLayerCreator = [&](ExecutionSession &session, 259 const Triple &tt) { 260 auto objectLayer = std::make_unique<RTDyldObjectLinkingLayer>( 261 session, []() { return std::make_unique<SectionMemoryManager>(); }); 262 263 // Register JIT event listeners if they are enabled. 264 if (engine->gdbListener) 265 objectLayer->registerJITEventListener(*engine->gdbListener); 266 if (engine->perfListener) 267 objectLayer->registerJITEventListener(*engine->perfListener); 268 269 // COFF format binaries (Windows) need special handling to deal with 270 // exported symbol visibility. 271 // cf llvm/lib/ExecutionEngine/Orc/LLJIT.cpp LLJIT::createObjectLinkingLayer 272 llvm::Triple targetTriple(llvm::Twine(llvmModule->getTargetTriple())); 273 if (targetTriple.isOSBinFormatCOFF()) { 274 objectLayer->setOverrideObjectFlagsWithResponsibilityFlags(true); 275 objectLayer->setAutoClaimResponsibilityForObjectSymbols(true); 276 } 277 278 // Resolve symbols from shared libraries. 279 for (auto libPath : sharedLibPaths) { 280 auto mb = llvm::MemoryBuffer::getFile(libPath); 281 if (!mb) { 282 errs() << "Failed to create MemoryBuffer for: " << libPath 283 << "\nError: " << mb.getError().message() << "\n"; 284 continue; 285 } 286 auto &jd = session.createBareJITDylib(std::string(libPath)); 287 auto loaded = DynamicLibrarySearchGenerator::Load( 288 libPath.data(), dataLayout.getGlobalPrefix()); 289 if (!loaded) { 290 errs() << "Could not load " << libPath << ":\n " << loaded.takeError() 291 << "\n"; 292 continue; 293 } 294 jd.addGenerator(std::move(*loaded)); 295 cantFail(objectLayer->add(jd, std::move(mb.get()))); 296 } 297 298 return objectLayer; 299 }; 300 301 // Callback to inspect the cache and recompile on demand. This follows Lang's 302 // LLJITWithObjectCache example. 303 auto compileFunctionCreator = [&](JITTargetMachineBuilder jtmb) 304 -> Expected<std::unique_ptr<IRCompileLayer::IRCompiler>> { 305 if (jitCodeGenOptLevel) 306 jtmb.setCodeGenOptLevel(jitCodeGenOptLevel.getValue()); 307 auto tm = jtmb.createTargetMachine(); 308 if (!tm) 309 return tm.takeError(); 310 return std::make_unique<TMOwningSimpleCompiler>(std::move(*tm), 311 engine->cache.get()); 312 }; 313 314 // Create the LLJIT by calling the LLJITBuilder with 2 callbacks. 315 auto jit = 316 cantFail(llvm::orc::LLJITBuilder() 317 .setCompileFunctionCreator(compileFunctionCreator) 318 .setObjectLinkingLayerCreator(objectLinkingLayerCreator) 319 .create()); 320 321 // Add a ThreadSafemodule to the engine and return. 322 ThreadSafeModule tsm(std::move(llvmModule), std::move(ctx)); 323 if (transformer) 324 cantFail(tsm.withModuleDo( 325 [&](llvm::Module &module) { return transformer(&module); })); 326 cantFail(jit->addIRModule(std::move(tsm))); 327 engine->jit = std::move(jit); 328 329 // Resolve symbols that are statically linked in the current process. 330 llvm::orc::JITDylib &mainJD = engine->jit->getMainJITDylib(); 331 mainJD.addGenerator( 332 cantFail(DynamicLibrarySearchGenerator::GetForCurrentProcess( 333 dataLayout.getGlobalPrefix()))); 334 335 return std::move(engine); 336 } 337 338 Expected<void (*)(void **)> 339 ExecutionEngine::lookupPacked(StringRef name) const { 340 auto result = lookup(makePackedFunctionName(name)); 341 if (!result) 342 return result.takeError(); 343 return reinterpret_cast<void (*)(void **)>(result.get()); 344 } 345 346 Expected<void *> ExecutionEngine::lookup(StringRef name) const { 347 auto expectedSymbol = jit->lookup(name); 348 349 // JIT lookup may return an Error referring to strings stored internally by 350 // the JIT. If the Error outlives the ExecutionEngine, it would want have a 351 // dangling reference, which is currently caught by an assertion inside JIT 352 // thanks to hand-rolled reference counting. Rewrap the error message into a 353 // string before returning. Alternatively, ORC JIT should consider copying 354 // the string into the error message. 355 if (!expectedSymbol) { 356 std::string errorMessage; 357 llvm::raw_string_ostream os(errorMessage); 358 llvm::handleAllErrors(expectedSymbol.takeError(), 359 [&os](llvm::ErrorInfoBase &ei) { ei.log(os); }); 360 return makeStringError(os.str()); 361 } 362 363 auto rawFPtr = expectedSymbol->getAddress(); 364 auto *fptr = reinterpret_cast<void *>(rawFPtr); 365 if (!fptr) 366 return makeStringError("looked up function is null"); 367 return fptr; 368 } 369 370 Error ExecutionEngine::invokePacked(StringRef name, 371 MutableArrayRef<void *> args) { 372 auto expectedFPtr = lookupPacked(name); 373 if (!expectedFPtr) 374 return expectedFPtr.takeError(); 375 auto fptr = *expectedFPtr; 376 377 (*fptr)(args.data()); 378 379 return Error::success(); 380 } 381