180814287SRaphael Isemann //===-- RenderScriptx86ABIFixups.cpp --------------------------------------===//
219459580SLuke Drummond //
32946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
42946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information.
52946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
619459580SLuke Drummond //
719459580SLuke Drummond //===----------------------------------------------------------------------===//
819459580SLuke Drummond 
919459580SLuke Drummond #include <set>
1019459580SLuke Drummond 
1119459580SLuke Drummond #include "llvm/ADT/StringRef.h"
1219459580SLuke Drummond #include "llvm/IR/BasicBlock.h"
1319459580SLuke Drummond #include "llvm/IR/Constants.h"
1419459580SLuke Drummond #include "llvm/IR/Function.h"
1519459580SLuke Drummond #include "llvm/IR/Instruction.h"
1619459580SLuke Drummond #include "llvm/IR/Instructions.h"
1719459580SLuke Drummond #include "llvm/IR/Module.h"
1819459580SLuke Drummond #include "llvm/IRReader/IRReader.h"
1919459580SLuke Drummond #include "llvm/Pass.h"
2019459580SLuke Drummond 
2119459580SLuke Drummond #include "lldb/Target/Process.h"
226f9e6901SZachary Turner #include "lldb/Utility/Log.h"
2319459580SLuke Drummond 
2419459580SLuke Drummond using namespace lldb_private;
2519459580SLuke Drummond 
26*93c1b3caSPavel Labath static bool isRSAPICall(llvm::Module &module, llvm::CallInst *call_inst) {
2719459580SLuke Drummond   // TODO get the list of renderscript modules from lldb and check if
2819459580SLuke Drummond   // this llvm::Module calls into any of them.
2919459580SLuke Drummond   (void)module;
3019459580SLuke Drummond   const auto func_name = call_inst->getCalledFunction()->getName();
3119459580SLuke Drummond   if (func_name.startswith("llvm") || func_name.startswith("lldb"))
3219459580SLuke Drummond     return false;
3319459580SLuke Drummond 
3419459580SLuke Drummond   if (call_inst->getCalledFunction()->isIntrinsic())
3519459580SLuke Drummond     return false;
3619459580SLuke Drummond 
3719459580SLuke Drummond   return true;
3819459580SLuke Drummond }
3919459580SLuke Drummond 
40*93c1b3caSPavel Labath static bool isRSLargeReturnCall(llvm::Module &module,
41*93c1b3caSPavel Labath                                 llvm::CallInst *call_inst) {
42b9c1b51eSKate Stone   // i686 and x86_64 returns for large vectors in the RenderScript API are not
4305097246SAdrian Prantl   // handled as normal register pairs, but as a hidden sret type. This is not
4405097246SAdrian Prantl   // reflected in the debug info or mangled symbol name, and the android ABI
4505097246SAdrian Prantl   // for x86 and x86_64, (as well as the emulators) specifies there is no AVX,
4605097246SAdrian Prantl   // so bcc generates an sret function because we cannot natively return
47b9c1b51eSKate Stone   // 256 bit vectors.
48b9c1b51eSKate Stone   // This function simply checks whether a function has a > 128bit return type.
4905097246SAdrian Prantl   // It is perhaps an unreliable heuristic, and relies on bcc not generating
5005097246SAdrian Prantl   // AVX code, so if the android ABI one day provides for AVX, this function
5105097246SAdrian Prantl   // may go out of fashion.
5219459580SLuke Drummond   (void)module;
5319459580SLuke Drummond   if (!call_inst || !call_inst->getCalledFunction())
5419459580SLuke Drummond     return false;
5519459580SLuke Drummond 
56b9c1b51eSKate Stone   return call_inst->getCalledFunction()
57b9c1b51eSKate Stone              ->getReturnType()
58b9c1b51eSKate Stone              ->getPrimitiveSizeInBits() > 128;
5919459580SLuke Drummond }
6019459580SLuke Drummond 
61*93c1b3caSPavel Labath static bool isRSAllocationPtrTy(const llvm::Type *type) {
6219459580SLuke Drummond   if (!type->isPointerTy())
6319459580SLuke Drummond     return false;
6419459580SLuke Drummond   auto ptr_type = type->getPointerElementType();
6519459580SLuke Drummond 
66b9c1b51eSKate Stone   return ptr_type->isStructTy() &&
67b9c1b51eSKate Stone          ptr_type->getStructName().startswith("struct.rs_allocation");
6819459580SLuke Drummond }
6919459580SLuke Drummond 
70*93c1b3caSPavel Labath static bool isRSAllocationTyCallSite(llvm::Module &module,
71*93c1b3caSPavel Labath                                      llvm::CallInst *call_inst) {
7219459580SLuke Drummond   (void)module;
7319459580SLuke Drummond   if (!call_inst->hasByValArgument())
7419459580SLuke Drummond     return false;
758dc7b982SMark de Wever   for (const auto *param : call_inst->operand_values())
7619459580SLuke Drummond     if (isRSAllocationPtrTy(param->getType()))
7719459580SLuke Drummond       return true;
7819459580SLuke Drummond   return false;
7919459580SLuke Drummond }
8019459580SLuke Drummond 
81*93c1b3caSPavel Labath static llvm::FunctionType *cloneToStructRetFnTy(llvm::CallInst *call_inst) {
82b9c1b51eSKate Stone   // on x86 StructReturn functions return a pointer to the return value, rather
8305097246SAdrian Prantl   // than the return value itself
8405097246SAdrian Prantl   // [ref](http://www.agner.org/optimize/calling_conventions.pdf section 6). We
8505097246SAdrian Prantl   // create a return type by getting the pointer type of the old return type,
8605097246SAdrian Prantl   // and inserting a new initial argument of pointer type of the original
8705097246SAdrian Prantl   // return type.
88b9c1b51eSKate Stone   Log *log(
89b9c1b51eSKate Stone       GetLogIfAnyCategoriesSet(LIBLLDB_LOG_LANGUAGE | LIBLLDB_LOG_EXPRESSIONS));
9019459580SLuke Drummond 
9119459580SLuke Drummond   assert(call_inst && "no CallInst");
9219459580SLuke Drummond   llvm::Function *orig = call_inst->getCalledFunction();
9319459580SLuke Drummond   assert(orig && "CallInst has no called function");
9419459580SLuke Drummond   llvm::FunctionType *orig_type = orig->getFunctionType();
9519459580SLuke Drummond   auto name = orig->getName();
9663e5fb76SJonas Devlieghere   LLDB_LOGF(log, "%s - cloning to StructRet function for '%s'", __FUNCTION__,
97b9c1b51eSKate Stone             name.str().c_str());
9819459580SLuke Drummond 
9919459580SLuke Drummond   unsigned num_params = orig_type->getNumParams();
1009d83de42SLuke Drummond   std::vector<llvm::Type *> new_params{num_params + 1, nullptr};
101b9c1b51eSKate Stone   std::vector<llvm::Type *> params{orig_type->param_begin(),
102b9c1b51eSKate Stone                                    orig_type->param_end()};
10319459580SLuke Drummond 
104b9c1b51eSKate Stone   // This may not work if the function is somehow declared void as llvm is
10505097246SAdrian Prantl   // strongly typed and represents void* with i8*
106b9c1b51eSKate Stone   assert(!orig_type->getReturnType()->isVoidTy() &&
107b9c1b51eSKate Stone          "Cannot add StructRet attribute to void function");
108b9c1b51eSKate Stone   llvm::PointerType *return_type_ptr_type =
109b9c1b51eSKate Stone       llvm::PointerType::getUnqual(orig->getReturnType());
110b9c1b51eSKate Stone   assert(return_type_ptr_type &&
111b9c1b51eSKate Stone          "failed to get function return type PointerType");
11219459580SLuke Drummond   if (!return_type_ptr_type)
11319459580SLuke Drummond     return nullptr;
11419459580SLuke Drummond 
11563e5fb76SJonas Devlieghere   LLDB_LOGF(log,
11663e5fb76SJonas Devlieghere             "%s - return type pointer type for StructRet clone @ '0x%p':\n",
117b9c1b51eSKate Stone             __FUNCTION__, (void *)return_type_ptr_type);
1184ebdee0aSBruce Mitchener   // put the sret pointer argument in place at the beginning of the
11905097246SAdrian Prantl   // argument list.
12019459580SLuke Drummond   params.emplace(params.begin(), return_type_ptr_type);
12119459580SLuke Drummond   assert(params.size() == num_params + 1);
122b9c1b51eSKate Stone   return llvm::FunctionType::get(return_type_ptr_type, params,
123b9c1b51eSKate Stone                                  orig->isVarArg());
12419459580SLuke Drummond }
12519459580SLuke Drummond 
126*93c1b3caSPavel Labath static bool
127*93c1b3caSPavel Labath findRSCallSites(llvm::Module &module, std::set<llvm::CallInst *> &rs_callsites,
128b9c1b51eSKate Stone                 bool (*predicate)(llvm::Module &, llvm::CallInst *)) {
12919459580SLuke Drummond   bool found = false;
13019459580SLuke Drummond 
13119459580SLuke Drummond   for (auto &func : module.getFunctionList())
13219459580SLuke Drummond     for (auto &block : func.getBasicBlockList())
133b9c1b51eSKate Stone       for (auto &inst : block) {
134b9c1b51eSKate Stone         llvm::CallInst *call_inst =
135b9c1b51eSKate Stone             llvm::dyn_cast_or_null<llvm::CallInst>(&inst);
13619459580SLuke Drummond         if (!call_inst || !call_inst->getCalledFunction())
13719459580SLuke Drummond           // This is not the call-site you are looking for...
13819459580SLuke Drummond           continue;
139b9c1b51eSKate Stone         if (isRSAPICall(module, call_inst) && predicate(module, call_inst)) {
14019459580SLuke Drummond           rs_callsites.insert(call_inst);
14119459580SLuke Drummond           found = true;
14219459580SLuke Drummond         }
14319459580SLuke Drummond       }
14419459580SLuke Drummond   return found;
14519459580SLuke Drummond }
14619459580SLuke Drummond 
147*93c1b3caSPavel Labath static bool fixupX86StructRetCalls(llvm::Module &module) {
14819459580SLuke Drummond   bool changed = false;
14905097246SAdrian Prantl   // changing a basic block while iterating over it seems to have some
15005097246SAdrian Prantl   // undefined behaviour going on so we find all RS callsites first, then fix
15105097246SAdrian Prantl   // them up after consuming the iterator.
15219459580SLuke Drummond   std::set<llvm::CallInst *> rs_callsites;
15319459580SLuke Drummond   if (!findRSCallSites(module, rs_callsites, isRSLargeReturnCall))
15419459580SLuke Drummond     return false;
15519459580SLuke Drummond 
156b9c1b51eSKate Stone   for (auto call_inst : rs_callsites) {
15719459580SLuke Drummond     llvm::FunctionType *new_func_type = cloneToStructRetFnTy(call_inst);
158b9c1b51eSKate Stone     assert(new_func_type &&
159b9c1b51eSKate Stone            "failed to clone functionType for Renderscript ABI fixup");
16019459580SLuke Drummond 
16119459580SLuke Drummond     llvm::Function *func = call_inst->getCalledFunction();
16219459580SLuke Drummond     assert(func && "cannot resolve function in RenderScriptRuntime");
16319459580SLuke Drummond     // Copy the original call arguments
1645948dafcSMircea Trofin     std::vector<llvm::Value *> new_call_args(call_inst->arg_begin(),
1655948dafcSMircea Trofin                                              call_inst->arg_end());
16619459580SLuke Drummond 
16719459580SLuke Drummond     // Allocate enough space to store the return value of the original function
168b9c1b51eSKate Stone     // we pass a pointer to this allocation as the StructRet param, and then
16905097246SAdrian Prantl     // copy its value into the lldb return value
17075696ffaSMatt Arsenault     const llvm::DataLayout &DL = module.getDataLayout();
171b9c1b51eSKate Stone     llvm::AllocaInst *return_value_alloc = new llvm::AllocaInst(
17275696ffaSMatt Arsenault       func->getReturnType(), DL.getAllocaAddrSpace(), "var_vector_return_alloc",
17375696ffaSMatt Arsenault       call_inst);
17419459580SLuke Drummond     // use the new allocation as the new first argument
175b9c1b51eSKate Stone     new_call_args.emplace(new_call_args.begin(),
176b9c1b51eSKate Stone                           llvm::cast<llvm::Value>(return_value_alloc));
177b9c1b51eSKate Stone     llvm::PointerType *new_func_ptr_type =
178b9c1b51eSKate Stone         llvm::PointerType::get(new_func_type, 0);
17919459580SLuke Drummond     // Create the type cast from the old function type to the new one
180b9c1b51eSKate Stone     llvm::Constant *new_func_cast = llvm::ConstantExpr::getCast(
181b9c1b51eSKate Stone         llvm::Instruction::BitCast, func, new_func_ptr_type);
18219459580SLuke Drummond     // create an allocation for a new function pointer
183b9c1b51eSKate Stone     llvm::AllocaInst *new_func_ptr =
18475696ffaSMatt Arsenault         new llvm::AllocaInst(new_func_ptr_type, DL.getAllocaAddrSpace(),
18575696ffaSMatt Arsenault                              "new_func_ptr", call_inst);
18619459580SLuke Drummond     // store the new_func_cast to the newly allocated space
187a322f36cSDavid Blaikie     (new llvm::StoreInst(new_func_cast, new_func_ptr, call_inst))
188a322f36cSDavid Blaikie         ->setName("new_func_ptr_load_cast");
18919459580SLuke Drummond     // load the new function address ready for a jump
190b9c1b51eSKate Stone     llvm::LoadInst *new_func_addr_load =
1916612b826SMed Ismail Bennani         new llvm::LoadInst(new_func_ptr->getType()->getPointerElementType(),
1926612b826SMed Ismail Bennani                            new_func_ptr, "load_func_pointer", call_inst);
19319459580SLuke Drummond     // and create a callinstruction from it
194ae2f9512SJames Y Knight     llvm::CallInst *new_call_inst =
195ae2f9512SJames Y Knight         llvm::CallInst::Create(new_func_type, new_func_addr_load, new_call_args,
196ae2f9512SJames Y Knight                                "new_func_call", call_inst);
19719459580SLuke Drummond     new_call_inst->setCallingConv(call_inst->getCallingConv());
19819459580SLuke Drummond     new_call_inst->setTailCall(call_inst->isTailCall());
1996612b826SMed Ismail Bennani     llvm::LoadInst *lldb_save_result_address = new llvm::LoadInst(
2006612b826SMed Ismail Bennani         return_value_alloc->getType()->getPointerElementType(),
2016612b826SMed Ismail Bennani         return_value_alloc, "save_return_val", call_inst);
20219459580SLuke Drummond 
20319459580SLuke Drummond     // Now remove the old broken call
20419459580SLuke Drummond     call_inst->replaceAllUsesWith(lldb_save_result_address);
20519459580SLuke Drummond     call_inst->eraseFromParent();
20619459580SLuke Drummond     changed = true;
20719459580SLuke Drummond   }
20819459580SLuke Drummond   return changed;
20919459580SLuke Drummond }
21019459580SLuke Drummond 
211*93c1b3caSPavel Labath static bool fixupRSAllocationStructByValCalls(llvm::Module &module) {
212b9c1b51eSKate Stone   // On x86_64, calls to functions in the RS runtime that take an
21305097246SAdrian Prantl   // `rs_allocation` type argument are actually handled as by-ref params by
21405097246SAdrian Prantl   // bcc, but appear to be passed by value by lldb (the callsite all use
21505097246SAdrian Prantl   // `struct byval`). On x86_64 Linux, struct arguments are transferred in
21605097246SAdrian Prantl   // registers if the struct size is no bigger than 128bits
21705097246SAdrian Prantl   // [ref](http://www.agner.org/optimize/calling_conventions.pdf) section 7.1
21805097246SAdrian Prantl   // "Passing and returning objects" otherwise passed on the stack. an object
21905097246SAdrian Prantl   // of type `rs_allocation` is actually 256bits, so should be passed on the
22005097246SAdrian Prantl   // stack. However, code generated by bcc actually treats formal params of
22105097246SAdrian Prantl   // type `rs_allocation` as `rs_allocation *` so we need to convert the
222b9c1b51eSKate Stone   // calling convention to pass by reference, and remove any hint of byval from
223b9c1b51eSKate Stone   // formal parameters.
22419459580SLuke Drummond   bool changed = false;
22519459580SLuke Drummond   std::set<llvm::CallInst *> rs_callsites;
22619459580SLuke Drummond   if (!findRSCallSites(module, rs_callsites, isRSAllocationTyCallSite))
22719459580SLuke Drummond     return false;
22819459580SLuke Drummond 
22919459580SLuke Drummond   std::set<llvm::Function *> rs_functions;
23019459580SLuke Drummond 
23119459580SLuke Drummond   // for all call instructions
232b9c1b51eSKate Stone   for (auto call_inst : rs_callsites) {
233b9c1b51eSKate Stone     // add the called function to a set so that we can strip its byval
234b9c1b51eSKate Stone     // attributes in another pass
23519459580SLuke Drummond     rs_functions.insert(call_inst->getCalledFunction());
23619459580SLuke Drummond 
23719459580SLuke Drummond     // get the function attributes
238a3e3715cSReid Kleckner     llvm::AttributeList call_attribs = call_inst->getAttributes();
23919459580SLuke Drummond 
24019459580SLuke Drummond     // iterate over the argument attributes
241a7b4ce9cSArthur Eubanks     for (unsigned I : call_attribs.indexes()) {
24219459580SLuke Drummond       // if this argument is passed by val
243ebbf7f90SArthur Eubanks       if (call_attribs.hasAttributeAtIndex(I, llvm::Attribute::ByVal)) {
24419459580SLuke Drummond         // strip away the byval attribute
245ebbf7f90SArthur Eubanks         call_inst->removeAttributeAtIndex(I, llvm::Attribute::ByVal);
24619459580SLuke Drummond         changed = true;
24719459580SLuke Drummond       }
24819459580SLuke Drummond     }
24919459580SLuke Drummond   }
25019459580SLuke Drummond 
25119459580SLuke Drummond   // for all called function decls
252b9c1b51eSKate Stone   for (auto func : rs_functions) {
25319459580SLuke Drummond     // inspect all of the arguments in the call
25420670ba5SReid Kleckner     for (auto &arg : func->args()) {
255b9c1b51eSKate Stone       if (arg.hasByValAttr()) {
256f76a8ac5SReid Kleckner         arg.removeAttr(llvm::Attribute::ByVal);
25719459580SLuke Drummond         changed = true;
25819459580SLuke Drummond       }
25919459580SLuke Drummond     }
26019459580SLuke Drummond   }
26119459580SLuke Drummond   return changed;
26219459580SLuke Drummond }
26319459580SLuke Drummond 
264b9c1b51eSKate Stone namespace lldb_private {
265b9c1b51eSKate Stone namespace lldb_renderscript {
26619459580SLuke Drummond 
267b9c1b51eSKate Stone bool fixupX86FunctionCalls(llvm::Module &module) {
26819459580SLuke Drummond   return fixupX86StructRetCalls(module);
26919459580SLuke Drummond }
27019459580SLuke Drummond 
271b9c1b51eSKate Stone bool fixupX86_64FunctionCalls(llvm::Module &module) {
27219459580SLuke Drummond   bool changed = false;
27319459580SLuke Drummond   changed |= fixupX86StructRetCalls(module);
27419459580SLuke Drummond   changed |= fixupRSAllocationStructByValCalls(module);
27519459580SLuke Drummond   return changed;
27619459580SLuke Drummond }
27719459580SLuke Drummond 
27819459580SLuke Drummond } // end namespace lldb_renderscript
27919459580SLuke Drummond } // end namespace lldb_private
280