1696bd635SAlexander Shaposhnikov //===-- RenderScriptx86ABIFixups.cpp ----------------------------*- C++ -*-===//
219459580SLuke Drummond //
319459580SLuke Drummond //                     The LLVM Compiler Infrastructure
419459580SLuke Drummond //
519459580SLuke Drummond // This file is distributed under the University of Illinois Open Source
619459580SLuke Drummond // License. See LICENSE.TXT for details.
719459580SLuke Drummond //
819459580SLuke Drummond //===----------------------------------------------------------------------===//
919459580SLuke Drummond 
1019459580SLuke Drummond // C Includes
1119459580SLuke Drummond // C++ Includes
1219459580SLuke Drummond #include <set>
1319459580SLuke Drummond 
1419459580SLuke Drummond // Other libraries and framework includes
1519459580SLuke Drummond #include "llvm/ADT/StringRef.h"
1619459580SLuke Drummond #include "llvm/IR/BasicBlock.h"
1719459580SLuke Drummond #include "llvm/IR/CallSite.h"
1819459580SLuke Drummond #include "llvm/IR/Constants.h"
1919459580SLuke Drummond #include "llvm/IR/Function.h"
2019459580SLuke Drummond #include "llvm/IR/Instruction.h"
2119459580SLuke Drummond #include "llvm/IR/Instructions.h"
2219459580SLuke Drummond #include "llvm/IR/Module.h"
2319459580SLuke Drummond #include "llvm/IRReader/IRReader.h"
2419459580SLuke Drummond #include "llvm/Pass.h"
2519459580SLuke Drummond 
2619459580SLuke Drummond // Project includes
2719459580SLuke Drummond #include "lldb/Target/Process.h"
286f9e6901SZachary Turner #include "lldb/Utility/Log.h"
2919459580SLuke Drummond 
3019459580SLuke Drummond using namespace lldb_private;
31b9c1b51eSKate Stone namespace {
3219459580SLuke Drummond 
33b9c1b51eSKate Stone bool isRSAPICall(llvm::Module &module, llvm::CallInst *call_inst) {
3419459580SLuke Drummond   // TODO get the list of renderscript modules from lldb and check if
3519459580SLuke Drummond   // this llvm::Module calls into any of them.
3619459580SLuke Drummond   (void)module;
3719459580SLuke Drummond   const auto func_name = call_inst->getCalledFunction()->getName();
3819459580SLuke Drummond   if (func_name.startswith("llvm") || func_name.startswith("lldb"))
3919459580SLuke Drummond     return false;
4019459580SLuke Drummond 
4119459580SLuke Drummond   if (call_inst->getCalledFunction()->isIntrinsic())
4219459580SLuke Drummond     return false;
4319459580SLuke Drummond 
4419459580SLuke Drummond   return true;
4519459580SLuke Drummond }
4619459580SLuke Drummond 
47b9c1b51eSKate Stone bool isRSLargeReturnCall(llvm::Module &module, llvm::CallInst *call_inst) {
48b9c1b51eSKate Stone   // i686 and x86_64 returns for large vectors in the RenderScript API are not
4905097246SAdrian Prantl   // handled as normal register pairs, but as a hidden sret type. This is not
5005097246SAdrian Prantl   // reflected in the debug info or mangled symbol name, and the android ABI
5105097246SAdrian Prantl   // for x86 and x86_64, (as well as the emulators) specifies there is no AVX,
5205097246SAdrian Prantl   // so bcc generates an sret function because we cannot natively return
53b9c1b51eSKate Stone   // 256 bit vectors.
54b9c1b51eSKate Stone   // This function simply checks whether a function has a > 128bit return type.
5505097246SAdrian Prantl   // It is perhaps an unreliable heuristic, and relies on bcc not generating
5605097246SAdrian Prantl   // AVX code, so if the android ABI one day provides for AVX, this function
5705097246SAdrian Prantl   // may go out of fashion.
5819459580SLuke Drummond   (void)module;
5919459580SLuke Drummond   if (!call_inst || !call_inst->getCalledFunction())
6019459580SLuke Drummond     return false;
6119459580SLuke Drummond 
62b9c1b51eSKate Stone   return call_inst->getCalledFunction()
63b9c1b51eSKate Stone              ->getReturnType()
64b9c1b51eSKate Stone              ->getPrimitiveSizeInBits() > 128;
6519459580SLuke Drummond }
6619459580SLuke Drummond 
67b9c1b51eSKate Stone bool isRSAllocationPtrTy(const llvm::Type *type) {
6819459580SLuke Drummond   if (!type->isPointerTy())
6919459580SLuke Drummond     return false;
7019459580SLuke Drummond   auto ptr_type = type->getPointerElementType();
7119459580SLuke Drummond 
72b9c1b51eSKate Stone   return ptr_type->isStructTy() &&
73b9c1b51eSKate Stone          ptr_type->getStructName().startswith("struct.rs_allocation");
7419459580SLuke Drummond }
7519459580SLuke Drummond 
76b9c1b51eSKate Stone bool isRSAllocationTyCallSite(llvm::Module &module, llvm::CallInst *call_inst) {
7719459580SLuke Drummond   (void)module;
7819459580SLuke Drummond   if (!call_inst->hasByValArgument())
7919459580SLuke Drummond     return false;
8019459580SLuke Drummond   for (const auto &param : call_inst->operand_values())
8119459580SLuke Drummond     if (isRSAllocationPtrTy(param->getType()))
8219459580SLuke Drummond       return true;
8319459580SLuke Drummond   return false;
8419459580SLuke Drummond }
8519459580SLuke Drummond 
86b9c1b51eSKate Stone llvm::FunctionType *cloneToStructRetFnTy(llvm::CallInst *call_inst) {
87b9c1b51eSKate Stone   // on x86 StructReturn functions return a pointer to the return value, rather
8805097246SAdrian Prantl   // than the return value itself
8905097246SAdrian Prantl   // [ref](http://www.agner.org/optimize/calling_conventions.pdf section 6). We
9005097246SAdrian Prantl   // create a return type by getting the pointer type of the old return type,
9105097246SAdrian Prantl   // and inserting a new initial argument of pointer type of the original
9205097246SAdrian Prantl   // return type.
93b9c1b51eSKate Stone   Log *log(
94b9c1b51eSKate Stone       GetLogIfAnyCategoriesSet(LIBLLDB_LOG_LANGUAGE | LIBLLDB_LOG_EXPRESSIONS));
9519459580SLuke Drummond 
9619459580SLuke Drummond   assert(call_inst && "no CallInst");
9719459580SLuke Drummond   llvm::Function *orig = call_inst->getCalledFunction();
9819459580SLuke Drummond   assert(orig && "CallInst has no called function");
9919459580SLuke Drummond   llvm::FunctionType *orig_type = orig->getFunctionType();
10019459580SLuke Drummond   auto name = orig->getName();
10119459580SLuke Drummond   if (log)
102b9c1b51eSKate Stone     log->Printf("%s - cloning to StructRet function for '%s'", __FUNCTION__,
103b9c1b51eSKate Stone                 name.str().c_str());
10419459580SLuke Drummond 
10519459580SLuke Drummond   unsigned num_params = orig_type->getNumParams();
1069d83de42SLuke Drummond   std::vector<llvm::Type *> new_params{num_params + 1, nullptr};
107b9c1b51eSKate Stone   std::vector<llvm::Type *> params{orig_type->param_begin(),
108b9c1b51eSKate Stone                                    orig_type->param_end()};
10919459580SLuke Drummond 
110b9c1b51eSKate Stone   // This may not work if the function is somehow declared void as llvm is
11105097246SAdrian Prantl   // strongly typed and represents void* with i8*
112b9c1b51eSKate Stone   assert(!orig_type->getReturnType()->isVoidTy() &&
113b9c1b51eSKate Stone          "Cannot add StructRet attribute to void function");
114b9c1b51eSKate Stone   llvm::PointerType *return_type_ptr_type =
115b9c1b51eSKate Stone       llvm::PointerType::getUnqual(orig->getReturnType());
116b9c1b51eSKate Stone   assert(return_type_ptr_type &&
117b9c1b51eSKate Stone          "failed to get function return type PointerType");
11819459580SLuke Drummond   if (!return_type_ptr_type)
11919459580SLuke Drummond     return nullptr;
12019459580SLuke Drummond 
12119459580SLuke Drummond   if (log)
122b9c1b51eSKate Stone     log->Printf("%s - return type pointer type for StructRet clone @ '0x%p':\n",
123b9c1b51eSKate Stone                 __FUNCTION__, (void *)return_type_ptr_type);
124*4ebdee0aSBruce Mitchener   // put the sret pointer argument in place at the beginning of the
12505097246SAdrian Prantl   // argument list.
12619459580SLuke Drummond   params.emplace(params.begin(), return_type_ptr_type);
12719459580SLuke Drummond   assert(params.size() == num_params + 1);
128b9c1b51eSKate Stone   return llvm::FunctionType::get(return_type_ptr_type, params,
129b9c1b51eSKate Stone                                  orig->isVarArg());
13019459580SLuke Drummond }
13119459580SLuke Drummond 
132b9c1b51eSKate Stone bool findRSCallSites(llvm::Module &module,
133b9c1b51eSKate Stone                      std::set<llvm::CallInst *> &rs_callsites,
134b9c1b51eSKate Stone                      bool (*predicate)(llvm::Module &, llvm::CallInst *)) {
13519459580SLuke Drummond   bool found = false;
13619459580SLuke Drummond 
13719459580SLuke Drummond   for (auto &func : module.getFunctionList())
13819459580SLuke Drummond     for (auto &block : func.getBasicBlockList())
139b9c1b51eSKate Stone       for (auto &inst : block) {
140b9c1b51eSKate Stone         llvm::CallInst *call_inst =
141b9c1b51eSKate Stone             llvm::dyn_cast_or_null<llvm::CallInst>(&inst);
14219459580SLuke Drummond         if (!call_inst || !call_inst->getCalledFunction())
14319459580SLuke Drummond           // This is not the call-site you are looking for...
14419459580SLuke Drummond           continue;
145b9c1b51eSKate Stone         if (isRSAPICall(module, call_inst) && predicate(module, call_inst)) {
14619459580SLuke Drummond           rs_callsites.insert(call_inst);
14719459580SLuke Drummond           found = true;
14819459580SLuke Drummond         }
14919459580SLuke Drummond       }
15019459580SLuke Drummond   return found;
15119459580SLuke Drummond }
15219459580SLuke Drummond 
153b9c1b51eSKate Stone bool fixupX86StructRetCalls(llvm::Module &module) {
15419459580SLuke Drummond   bool changed = false;
15505097246SAdrian Prantl   // changing a basic block while iterating over it seems to have some
15605097246SAdrian Prantl   // undefined behaviour going on so we find all RS callsites first, then fix
15705097246SAdrian Prantl   // them up after consuming the iterator.
15819459580SLuke Drummond   std::set<llvm::CallInst *> rs_callsites;
15919459580SLuke Drummond   if (!findRSCallSites(module, rs_callsites, isRSLargeReturnCall))
16019459580SLuke Drummond     return false;
16119459580SLuke Drummond 
162b9c1b51eSKate Stone   for (auto call_inst : rs_callsites) {
16319459580SLuke Drummond     llvm::FunctionType *new_func_type = cloneToStructRetFnTy(call_inst);
164b9c1b51eSKate Stone     assert(new_func_type &&
165b9c1b51eSKate Stone            "failed to clone functionType for Renderscript ABI fixup");
16619459580SLuke Drummond 
16719459580SLuke Drummond     llvm::CallSite call_site(call_inst);
16819459580SLuke Drummond     llvm::Function *func = call_inst->getCalledFunction();
16919459580SLuke Drummond     assert(func && "cannot resolve function in RenderScriptRuntime");
17019459580SLuke Drummond     // Copy the original call arguments
171b9c1b51eSKate Stone     std::vector<llvm::Value *> new_call_args(call_site.arg_begin(),
172b9c1b51eSKate Stone                                              call_site.arg_end());
17319459580SLuke Drummond 
17419459580SLuke Drummond     // Allocate enough space to store the return value of the original function
175b9c1b51eSKate Stone     // we pass a pointer to this allocation as the StructRet param, and then
17605097246SAdrian Prantl     // copy its value into the lldb return value
17775696ffaSMatt Arsenault     const llvm::DataLayout &DL = module.getDataLayout();
178b9c1b51eSKate Stone     llvm::AllocaInst *return_value_alloc = new llvm::AllocaInst(
17975696ffaSMatt Arsenault       func->getReturnType(), DL.getAllocaAddrSpace(), "var_vector_return_alloc",
18075696ffaSMatt Arsenault       call_inst);
18119459580SLuke Drummond     // use the new allocation as the new first argument
182b9c1b51eSKate Stone     new_call_args.emplace(new_call_args.begin(),
183b9c1b51eSKate Stone                           llvm::cast<llvm::Value>(return_value_alloc));
184b9c1b51eSKate Stone     llvm::PointerType *new_func_ptr_type =
185b9c1b51eSKate Stone         llvm::PointerType::get(new_func_type, 0);
18619459580SLuke Drummond     // Create the type cast from the old function type to the new one
187b9c1b51eSKate Stone     llvm::Constant *new_func_cast = llvm::ConstantExpr::getCast(
188b9c1b51eSKate Stone         llvm::Instruction::BitCast, func, new_func_ptr_type);
18919459580SLuke Drummond     // create an allocation for a new function pointer
190b9c1b51eSKate Stone     llvm::AllocaInst *new_func_ptr =
19175696ffaSMatt Arsenault         new llvm::AllocaInst(new_func_ptr_type, DL.getAllocaAddrSpace(),
19275696ffaSMatt Arsenault                              "new_func_ptr", call_inst);
19319459580SLuke Drummond     // store the new_func_cast to the newly allocated space
194a322f36cSDavid Blaikie     (new llvm::StoreInst(new_func_cast, new_func_ptr, call_inst))
195a322f36cSDavid Blaikie         ->setName("new_func_ptr_load_cast");
19619459580SLuke Drummond     // load the new function address ready for a jump
197b9c1b51eSKate Stone     llvm::LoadInst *new_func_addr_load =
198b9c1b51eSKate Stone         new llvm::LoadInst(new_func_ptr, "load_func_pointer", call_inst);
19919459580SLuke Drummond     // and create a callinstruction from it
200b9c1b51eSKate Stone     llvm::CallInst *new_call_inst = llvm::CallInst::Create(
201b9c1b51eSKate Stone         new_func_addr_load, new_call_args, "new_func_call", call_inst);
20219459580SLuke Drummond     new_call_inst->setCallingConv(call_inst->getCallingConv());
20319459580SLuke Drummond     new_call_inst->setTailCall(call_inst->isTailCall());
204b9c1b51eSKate Stone     llvm::LoadInst *lldb_save_result_address =
205b9c1b51eSKate Stone         new llvm::LoadInst(return_value_alloc, "save_return_val", call_inst);
20619459580SLuke Drummond 
20719459580SLuke Drummond     // Now remove the old broken call
20819459580SLuke Drummond     call_inst->replaceAllUsesWith(lldb_save_result_address);
20919459580SLuke Drummond     call_inst->eraseFromParent();
21019459580SLuke Drummond     changed = true;
21119459580SLuke Drummond   }
21219459580SLuke Drummond   return changed;
21319459580SLuke Drummond }
21419459580SLuke Drummond 
215b9c1b51eSKate Stone bool fixupRSAllocationStructByValCalls(llvm::Module &module) {
216b9c1b51eSKate Stone   // On x86_64, calls to functions in the RS runtime that take an
21705097246SAdrian Prantl   // `rs_allocation` type argument are actually handled as by-ref params by
21805097246SAdrian Prantl   // bcc, but appear to be passed by value by lldb (the callsite all use
21905097246SAdrian Prantl   // `struct byval`). On x86_64 Linux, struct arguments are transferred in
22005097246SAdrian Prantl   // registers if the struct size is no bigger than 128bits
22105097246SAdrian Prantl   // [ref](http://www.agner.org/optimize/calling_conventions.pdf) section 7.1
22205097246SAdrian Prantl   // "Passing and returning objects" otherwise passed on the stack. an object
22305097246SAdrian Prantl   // of type `rs_allocation` is actually 256bits, so should be passed on the
22405097246SAdrian Prantl   // stack. However, code generated by bcc actually treats formal params of
22505097246SAdrian Prantl   // type `rs_allocation` as `rs_allocation *` so we need to convert the
226b9c1b51eSKate Stone   // calling convention to pass by reference, and remove any hint of byval from
227b9c1b51eSKate Stone   // formal parameters.
22819459580SLuke Drummond   bool changed = false;
22919459580SLuke Drummond   std::set<llvm::CallInst *> rs_callsites;
23019459580SLuke Drummond   if (!findRSCallSites(module, rs_callsites, isRSAllocationTyCallSite))
23119459580SLuke Drummond     return false;
23219459580SLuke Drummond 
23319459580SLuke Drummond   std::set<llvm::Function *> rs_functions;
23419459580SLuke Drummond 
23519459580SLuke Drummond   // for all call instructions
236b9c1b51eSKate Stone   for (auto call_inst : rs_callsites) {
237b9c1b51eSKate Stone     // add the called function to a set so that we can strip its byval
238b9c1b51eSKate Stone     // attributes in another pass
23919459580SLuke Drummond     rs_functions.insert(call_inst->getCalledFunction());
24019459580SLuke Drummond 
24119459580SLuke Drummond     // get the function attributes
242a3e3715cSReid Kleckner     llvm::AttributeList call_attribs = call_inst->getAttributes();
24319459580SLuke Drummond 
24419459580SLuke Drummond     // iterate over the argument attributes
24502295000SStephane Sezer     for (unsigned I = call_attribs.index_begin(); I != call_attribs.index_end();
24602295000SStephane Sezer          I++) {
24719459580SLuke Drummond       // if this argument is passed by val
248e3bb52bbSStephane Sezer       if (call_attribs.hasAttribute(I, llvm::Attribute::ByVal)) {
24919459580SLuke Drummond         // strip away the byval attribute
250e3bb52bbSStephane Sezer         call_inst->removeAttribute(I, llvm::Attribute::ByVal);
25119459580SLuke Drummond         changed = true;
25219459580SLuke Drummond       }
25319459580SLuke Drummond     }
25419459580SLuke Drummond   }
25519459580SLuke Drummond 
25619459580SLuke Drummond   // for all called function decls
257b9c1b51eSKate Stone   for (auto func : rs_functions) {
25819459580SLuke Drummond     // inspect all of the arguments in the call
25920670ba5SReid Kleckner     for (auto &arg : func->args()) {
260b9c1b51eSKate Stone       if (arg.hasByValAttr()) {
261f76a8ac5SReid Kleckner         arg.removeAttr(llvm::Attribute::ByVal);
26219459580SLuke Drummond         changed = true;
26319459580SLuke Drummond       }
26419459580SLuke Drummond     }
26519459580SLuke Drummond   }
26619459580SLuke Drummond   return changed;
26719459580SLuke Drummond }
26819459580SLuke Drummond } // end anonymous namespace
26919459580SLuke Drummond 
270b9c1b51eSKate Stone namespace lldb_private {
271b9c1b51eSKate Stone namespace lldb_renderscript {
27219459580SLuke Drummond 
273b9c1b51eSKate Stone bool fixupX86FunctionCalls(llvm::Module &module) {
27419459580SLuke Drummond   return fixupX86StructRetCalls(module);
27519459580SLuke Drummond }
27619459580SLuke Drummond 
277b9c1b51eSKate Stone bool fixupX86_64FunctionCalls(llvm::Module &module) {
27819459580SLuke Drummond   bool changed = false;
27919459580SLuke Drummond   changed |= fixupX86StructRetCalls(module);
28019459580SLuke Drummond   changed |= fixupRSAllocationStructByValCalls(module);
28119459580SLuke Drummond   return changed;
28219459580SLuke Drummond }
28319459580SLuke Drummond 
28419459580SLuke Drummond } // end namespace lldb_renderscript
28519459580SLuke Drummond } // end namespace lldb_private
286