119459580SLuke Drummond //===-- x86ABIFixups.cpp ----------------------------------------*- C++ -*-===// 219459580SLuke Drummond // 319459580SLuke Drummond // The LLVM Compiler Infrastructure 419459580SLuke Drummond // 519459580SLuke Drummond // This file is distributed under the University of Illinois Open Source 619459580SLuke Drummond // License. See LICENSE.TXT for details. 719459580SLuke Drummond // 819459580SLuke Drummond //===----------------------------------------------------------------------===// 919459580SLuke Drummond 1019459580SLuke Drummond // C Includes 1119459580SLuke Drummond // C++ Includes 1219459580SLuke Drummond #include <set> 1319459580SLuke Drummond 1419459580SLuke Drummond // Other libraries and framework includes 1519459580SLuke Drummond #include "llvm/ADT/StringRef.h" 1619459580SLuke Drummond #include "llvm/IR/BasicBlock.h" 1719459580SLuke Drummond #include "llvm/IR/CallSite.h" 1819459580SLuke Drummond #include "llvm/IR/Constants.h" 1919459580SLuke Drummond #include "llvm/IR/Function.h" 2019459580SLuke Drummond #include "llvm/IR/Instruction.h" 2119459580SLuke Drummond #include "llvm/IR/Instructions.h" 2219459580SLuke Drummond #include "llvm/IR/Module.h" 2319459580SLuke Drummond #include "llvm/IRReader/IRReader.h" 2419459580SLuke Drummond #include "llvm/Pass.h" 2519459580SLuke Drummond 2619459580SLuke Drummond // Project includes 2719459580SLuke Drummond #include "lldb/Core/Log.h" 2819459580SLuke Drummond #include "lldb/Target/Process.h" 2919459580SLuke Drummond 3019459580SLuke Drummond using namespace lldb_private; 3119459580SLuke Drummond namespace 3219459580SLuke Drummond { 3319459580SLuke Drummond 3419459580SLuke Drummond bool 3519459580SLuke Drummond isRSAPICall(llvm::Module &module, llvm::CallInst *call_inst) 3619459580SLuke Drummond { 3719459580SLuke Drummond // TODO get the list of renderscript modules from lldb and check if 3819459580SLuke Drummond // this llvm::Module calls into any of them. 3919459580SLuke Drummond (void)module; 4019459580SLuke Drummond const auto func_name = call_inst->getCalledFunction()->getName(); 4119459580SLuke Drummond if (func_name.startswith("llvm") || func_name.startswith("lldb")) 4219459580SLuke Drummond return false; 4319459580SLuke Drummond 4419459580SLuke Drummond if (call_inst->getCalledFunction()->isIntrinsic()) 4519459580SLuke Drummond return false; 4619459580SLuke Drummond 4719459580SLuke Drummond return true; 4819459580SLuke Drummond } 4919459580SLuke Drummond 5019459580SLuke Drummond bool 5119459580SLuke Drummond isRSLargeReturnCall(llvm::Module &module, llvm::CallInst *call_inst) 5219459580SLuke Drummond { 5319459580SLuke Drummond // i686 and x86_64 returns for large vectors in the RenderScript API are not handled as normal 5419459580SLuke Drummond // register pairs, but as a hidden sret type. This is not reflected in the debug info or mangled 5519459580SLuke Drummond // symbol name, and the android ABI for x86 and x86_64, (as well as the emulators) specifies there is 5619459580SLuke Drummond // no AVX, so bcc generates an sret function because we cannot natively return 256 bit vectors. 5719459580SLuke Drummond // This function simply checks whether a function has a > 128bit return type. It is perhaps an 5819459580SLuke Drummond // unreliable heuristic, and relies on bcc not generating AVX code, so if the android ABI one day 5919459580SLuke Drummond // provides for AVX, this function may go out of fashion. 6019459580SLuke Drummond (void)module; 6119459580SLuke Drummond if (!call_inst || !call_inst->getCalledFunction()) 6219459580SLuke Drummond return false; 6319459580SLuke Drummond 6419459580SLuke Drummond return call_inst->getCalledFunction()->getReturnType()->getPrimitiveSizeInBits() > 128; 6519459580SLuke Drummond } 6619459580SLuke Drummond 6719459580SLuke Drummond bool 6819459580SLuke Drummond isRSAllocationPtrTy(const llvm::Type *type) 6919459580SLuke Drummond { 7019459580SLuke Drummond if (!type->isPointerTy()) 7119459580SLuke Drummond return false; 7219459580SLuke Drummond auto ptr_type = type->getPointerElementType(); 7319459580SLuke Drummond 7419459580SLuke Drummond return ptr_type->isStructTy() && ptr_type->getStructName().startswith("struct.rs_allocation"); 7519459580SLuke Drummond } 7619459580SLuke Drummond 7719459580SLuke Drummond bool 7819459580SLuke Drummond isRSAllocationTyCallSite(llvm::Module &module, llvm::CallInst *call_inst) 7919459580SLuke Drummond { 8019459580SLuke Drummond (void)module; 8119459580SLuke Drummond if (!call_inst->hasByValArgument()) 8219459580SLuke Drummond return false; 8319459580SLuke Drummond for (const auto ¶m : call_inst->operand_values()) 8419459580SLuke Drummond if (isRSAllocationPtrTy(param->getType())) 8519459580SLuke Drummond return true; 8619459580SLuke Drummond return false; 8719459580SLuke Drummond } 8819459580SLuke Drummond 8919459580SLuke Drummond llvm::FunctionType * 9019459580SLuke Drummond cloneToStructRetFnTy(llvm::CallInst *call_inst) 9119459580SLuke Drummond { 9219459580SLuke Drummond // on x86 StructReturn functions return a pointer to the return value, rather than the return 9319459580SLuke Drummond // value itself [ref](http://www.agner.org/optimize/calling_conventions.pdf section 6). 9419459580SLuke Drummond // We create a return type by getting the pointer type of the old return type, and inserting a new 9519459580SLuke Drummond // initial argument of pointer type of the original return type. 9619459580SLuke Drummond Log *log(GetLogIfAnyCategoriesSet(LIBLLDB_LOG_LANGUAGE | LIBLLDB_LOG_EXPRESSIONS)); 9719459580SLuke Drummond 9819459580SLuke Drummond assert(call_inst && "no CallInst"); 9919459580SLuke Drummond llvm::Function *orig = call_inst->getCalledFunction(); 10019459580SLuke Drummond assert(orig && "CallInst has no called function"); 10119459580SLuke Drummond llvm::FunctionType *orig_type = orig->getFunctionType(); 10219459580SLuke Drummond auto name = orig->getName(); 10319459580SLuke Drummond if (log) 10419459580SLuke Drummond log->Printf("%s - cloning to StructRet function for '%s'", __FUNCTION__, name.str().c_str()); 10519459580SLuke Drummond 10619459580SLuke Drummond unsigned num_params = orig_type->getNumParams(); 107*9d83de42SLuke Drummond std::vector<llvm::Type *> new_params{num_params + 1, nullptr}; 10819459580SLuke Drummond std::vector<llvm::Type *> params{orig_type->param_begin(), orig_type->param_end()}; 10919459580SLuke Drummond 11019459580SLuke Drummond // This may not work if the function is somehow declared void as llvm is strongly typed 11119459580SLuke Drummond // and represents void* with i8* 11219459580SLuke Drummond assert(!orig_type->getReturnType()->isVoidTy() && "Cannot add StructRet attribute to void function"); 11319459580SLuke Drummond llvm::PointerType *return_type_ptr_type = llvm::PointerType::getUnqual(orig->getReturnType()); 11419459580SLuke Drummond assert(return_type_ptr_type && "failed to get function return type PointerType"); 11519459580SLuke Drummond if (!return_type_ptr_type) 11619459580SLuke Drummond return nullptr; 11719459580SLuke Drummond 11819459580SLuke Drummond if (log) 11919459580SLuke Drummond log->Printf("%s - return type pointer type for StructRet clone @ '0x%p':\n", __FUNCTION__, 12019459580SLuke Drummond (void *)return_type_ptr_type); 12119459580SLuke Drummond // put the the sret pointer argument in place at the beginning of the argument list. 12219459580SLuke Drummond params.emplace(params.begin(), return_type_ptr_type); 12319459580SLuke Drummond assert(params.size() == num_params + 1); 12419459580SLuke Drummond return llvm::FunctionType::get(return_type_ptr_type, params, orig->isVarArg()); 12519459580SLuke Drummond } 12619459580SLuke Drummond 12719459580SLuke Drummond bool 12819459580SLuke Drummond findRSCallSites(llvm::Module &module, std::set<llvm::CallInst *> &rs_callsites, 12919459580SLuke Drummond bool (*predicate)(llvm::Module &, llvm::CallInst *)) 13019459580SLuke Drummond { 13119459580SLuke Drummond bool found = false; 13219459580SLuke Drummond 13319459580SLuke Drummond for (auto &func : module.getFunctionList()) 13419459580SLuke Drummond for (auto &block : func.getBasicBlockList()) 13519459580SLuke Drummond for (auto &inst : block) 13619459580SLuke Drummond { 13719459580SLuke Drummond llvm::CallInst *call_inst = llvm::dyn_cast_or_null<llvm::CallInst>(&inst); 13819459580SLuke Drummond if (!call_inst || !call_inst->getCalledFunction()) 13919459580SLuke Drummond // This is not the call-site you are looking for... 14019459580SLuke Drummond continue; 14119459580SLuke Drummond if (isRSAPICall(module, call_inst) && predicate(module, call_inst)) 14219459580SLuke Drummond { 14319459580SLuke Drummond rs_callsites.insert(call_inst); 14419459580SLuke Drummond found = true; 14519459580SLuke Drummond } 14619459580SLuke Drummond } 14719459580SLuke Drummond return found; 14819459580SLuke Drummond } 14919459580SLuke Drummond 15019459580SLuke Drummond bool 15119459580SLuke Drummond fixupX86StructRetCalls(llvm::Module &module) 15219459580SLuke Drummond { 15319459580SLuke Drummond bool changed = false; 15419459580SLuke Drummond // changing a basic block while iterating over it seems to have some undefined behaviour 15519459580SLuke Drummond // going on so we find all RS callsites first, then fix them up after consuming 15619459580SLuke Drummond // the iterator. 15719459580SLuke Drummond std::set<llvm::CallInst *> rs_callsites; 15819459580SLuke Drummond if (!findRSCallSites(module, rs_callsites, isRSLargeReturnCall)) 15919459580SLuke Drummond return false; 16019459580SLuke Drummond 16119459580SLuke Drummond for (auto call_inst : rs_callsites) 16219459580SLuke Drummond { 16319459580SLuke Drummond llvm::FunctionType *new_func_type = cloneToStructRetFnTy(call_inst); 16419459580SLuke Drummond assert(new_func_type && "failed to clone functionType for Renderscript ABI fixup"); 16519459580SLuke Drummond 16619459580SLuke Drummond llvm::CallSite call_site(call_inst); 16719459580SLuke Drummond llvm::Function *func = call_inst->getCalledFunction(); 16819459580SLuke Drummond assert(func && "cannot resolve function in RenderScriptRuntime"); 16919459580SLuke Drummond // Copy the original call arguments 17019459580SLuke Drummond std::vector<llvm::Value *> new_call_args(call_site.arg_begin(), call_site.arg_end()); 17119459580SLuke Drummond 17219459580SLuke Drummond // Allocate enough space to store the return value of the original function 17319459580SLuke Drummond // we pass a pointer to this allocation as the StructRet param, and then copy its 17419459580SLuke Drummond // value into the lldb return value 17519459580SLuke Drummond llvm::AllocaInst *return_value_alloc = 17619459580SLuke Drummond new llvm::AllocaInst(func->getReturnType(), "var_vector_return_alloc", call_inst); 17719459580SLuke Drummond // use the new allocation as the new first argument 17819459580SLuke Drummond new_call_args.emplace(new_call_args.begin(), llvm::cast<llvm::Value>(return_value_alloc)); 17919459580SLuke Drummond llvm::PointerType *new_func_ptr_type = llvm::PointerType::get(new_func_type, 0); 18019459580SLuke Drummond // Create the type cast from the old function type to the new one 18119459580SLuke Drummond llvm::Constant *new_func_cast = 18219459580SLuke Drummond llvm::ConstantExpr::getCast(llvm::Instruction::BitCast, func, new_func_ptr_type); 18319459580SLuke Drummond // create an allocation for a new function pointer 18419459580SLuke Drummond llvm::AllocaInst *new_func_ptr = new llvm::AllocaInst(new_func_ptr_type, "new_func_ptr", call_inst); 18519459580SLuke Drummond // store the new_func_cast to the newly allocated space 18619459580SLuke Drummond (void)new llvm::StoreInst(new_func_cast, new_func_ptr, "new_func_ptr_load_cast", call_inst); 18719459580SLuke Drummond // load the new function address ready for a jump 18819459580SLuke Drummond llvm::LoadInst *new_func_addr_load = new llvm::LoadInst(new_func_ptr, "load_func_pointer", call_inst); 18919459580SLuke Drummond // and create a callinstruction from it 19019459580SLuke Drummond llvm::CallInst *new_call_inst = 19119459580SLuke Drummond llvm::CallInst::Create(new_func_addr_load, new_call_args, "new_func_call", call_inst); 19219459580SLuke Drummond new_call_inst->setCallingConv(call_inst->getCallingConv()); 19319459580SLuke Drummond new_call_inst->setTailCall(call_inst->isTailCall()); 19419459580SLuke Drummond llvm::LoadInst *lldb_save_result_address = new llvm::LoadInst(return_value_alloc, "save_return_val", call_inst); 19519459580SLuke Drummond 19619459580SLuke Drummond // Now remove the old broken call 19719459580SLuke Drummond call_inst->replaceAllUsesWith(lldb_save_result_address); 19819459580SLuke Drummond call_inst->eraseFromParent(); 19919459580SLuke Drummond changed = true; 20019459580SLuke Drummond } 20119459580SLuke Drummond return changed; 20219459580SLuke Drummond } 20319459580SLuke Drummond 20419459580SLuke Drummond bool 20519459580SLuke Drummond fixupRSAllocationStructByValCalls(llvm::Module &module) 20619459580SLuke Drummond { 20719459580SLuke Drummond // On x86_64, calls to functions in the RS runtime that take an `rs_allocation` type argument 20819459580SLuke Drummond // are actually handled as by-ref params by bcc, but appear to be passed by value by lldb (the callsite all use 20919459580SLuke Drummond // `struct byval`). 21019459580SLuke Drummond // On x86_64 Linux, struct arguments are transferred in registers if the struct size is no bigger than 21119459580SLuke Drummond // 128bits [ref](http://www.agner.org/optimize/calling_conventions.pdf) section 7.1 "Passing and returning objects" 21219459580SLuke Drummond // otherwise passed on the stack. 21319459580SLuke Drummond // an object of type `rs_allocation` is actually 256bits, so should be passed on the stack. However, code generated 21419459580SLuke Drummond // by bcc actually treats formal params of type `rs_allocation` as `rs_allocation *` so we need to convert the 21519459580SLuke Drummond // calling convention to pass by reference, and remove any hint of byval from formal parameters. 21619459580SLuke Drummond bool changed = false; 21719459580SLuke Drummond std::set<llvm::CallInst *> rs_callsites; 21819459580SLuke Drummond if (!findRSCallSites(module, rs_callsites, isRSAllocationTyCallSite)) 21919459580SLuke Drummond return false; 22019459580SLuke Drummond 22119459580SLuke Drummond std::set<llvm::Function *> rs_functions; 22219459580SLuke Drummond 22319459580SLuke Drummond // for all call instructions 22419459580SLuke Drummond for (auto call_inst : rs_callsites) 22519459580SLuke Drummond { 22619459580SLuke Drummond // add the called function to a set so that we can strip its byval attributes in another pass 22719459580SLuke Drummond rs_functions.insert(call_inst->getCalledFunction()); 22819459580SLuke Drummond 22919459580SLuke Drummond // get the function attributes 23019459580SLuke Drummond llvm::AttributeSet call_attribs = call_inst->getAttributes(); 23119459580SLuke Drummond 23219459580SLuke Drummond // iterate over the argument attributes 23319459580SLuke Drummond for (size_t i = 1; i <= call_attribs.getNumSlots(); ++i) 23419459580SLuke Drummond { 23519459580SLuke Drummond // if this argument is passed by val 23619459580SLuke Drummond if (call_attribs.hasAttribute(i, llvm::Attribute::ByVal)) 23719459580SLuke Drummond { 23819459580SLuke Drummond // strip away the byval attribute 23919459580SLuke Drummond call_inst->removeAttribute(i, llvm::Attribute::get(module.getContext(), llvm::Attribute::ByVal)); 24019459580SLuke Drummond changed = true; 24119459580SLuke Drummond } 24219459580SLuke Drummond } 24319459580SLuke Drummond } 24419459580SLuke Drummond 24519459580SLuke Drummond llvm::AttributeSet attr_byval = llvm::AttributeSet::get(module.getContext(), 1u, llvm::Attribute::ByVal); 24619459580SLuke Drummond 24719459580SLuke Drummond // for all called function decls 24819459580SLuke Drummond for (auto func : rs_functions) 24919459580SLuke Drummond { 25019459580SLuke Drummond // inspect all of the arguments in the call 25119459580SLuke Drummond llvm::SymbolTableList<llvm::Argument> &argList = func->getArgumentList(); 25219459580SLuke Drummond for (auto &arg : argList) 25319459580SLuke Drummond { 25419459580SLuke Drummond if (arg.hasByValAttr()) 25519459580SLuke Drummond { 25619459580SLuke Drummond arg.removeAttr(attr_byval); 25719459580SLuke Drummond changed = true; 25819459580SLuke Drummond } 25919459580SLuke Drummond } 26019459580SLuke Drummond } 26119459580SLuke Drummond return changed; 26219459580SLuke Drummond } 26319459580SLuke Drummond } // end anonymous namespace 26419459580SLuke Drummond 26519459580SLuke Drummond namespace lldb_private 26619459580SLuke Drummond { 26719459580SLuke Drummond namespace lldb_renderscript 26819459580SLuke Drummond { 26919459580SLuke Drummond 27019459580SLuke Drummond bool 27119459580SLuke Drummond fixupX86FunctionCalls(llvm::Module &module) 27219459580SLuke Drummond { 27319459580SLuke Drummond return fixupX86StructRetCalls(module); 27419459580SLuke Drummond } 27519459580SLuke Drummond 27619459580SLuke Drummond bool 27719459580SLuke Drummond fixupX86_64FunctionCalls(llvm::Module &module) 27819459580SLuke Drummond { 27919459580SLuke Drummond bool changed = false; 28019459580SLuke Drummond changed |= fixupX86StructRetCalls(module); 28119459580SLuke Drummond changed |= fixupRSAllocationStructByValCalls(module); 28219459580SLuke Drummond return changed; 28319459580SLuke Drummond } 28419459580SLuke Drummond 28519459580SLuke Drummond } // end namespace lldb_renderscript 28619459580SLuke Drummond } // end namespace lldb_private 287