//===-- x86ABIFixups.cpp ----------------------------------------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
919459580SLuke Drummond 
// C Includes
// C++ Includes
#include <set>

// Other libraries and framework includes
#include "llvm/ADT/StringRef.h"
#include "llvm/IR/BasicBlock.h"
#include "llvm/IR/CallSite.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/Module.h"
#include "llvm/IRReader/IRReader.h"
#include "llvm/Pass.h"

// Project includes
#include "lldb/Core/Log.h"
#include "lldb/Target/Process.h"
3019459580SLuke Drummond using namespace lldb_private;
3119459580SLuke Drummond namespace
3219459580SLuke Drummond {
3319459580SLuke Drummond 
3419459580SLuke Drummond bool
3519459580SLuke Drummond isRSAPICall(llvm::Module &module, llvm::CallInst *call_inst)
3619459580SLuke Drummond {
3719459580SLuke Drummond     // TODO get the list of renderscript modules from lldb and check if
3819459580SLuke Drummond     // this llvm::Module calls into any of them.
3919459580SLuke Drummond     (void)module;
4019459580SLuke Drummond     const auto func_name = call_inst->getCalledFunction()->getName();
4119459580SLuke Drummond     if (func_name.startswith("llvm") || func_name.startswith("lldb"))
4219459580SLuke Drummond         return false;
4319459580SLuke Drummond 
4419459580SLuke Drummond     if (call_inst->getCalledFunction()->isIntrinsic())
4519459580SLuke Drummond         return false;
4619459580SLuke Drummond 
4719459580SLuke Drummond     return true;
4819459580SLuke Drummond }
4919459580SLuke Drummond 
5019459580SLuke Drummond bool
5119459580SLuke Drummond isRSLargeReturnCall(llvm::Module &module, llvm::CallInst *call_inst)
5219459580SLuke Drummond {
5319459580SLuke Drummond     // i686 and x86_64 returns for large vectors in the RenderScript API are not handled as normal
5419459580SLuke Drummond     // register pairs, but as a hidden sret type. This is not reflected in the debug info or mangled
5519459580SLuke Drummond     // symbol name, and the android ABI for x86 and x86_64, (as well as the emulators) specifies there is
5619459580SLuke Drummond     // no AVX, so bcc generates an sret function because we cannot natively return 256 bit vectors.
5719459580SLuke Drummond     // This function simply checks whether a function has a > 128bit return type. It is perhaps an
5819459580SLuke Drummond     // unreliable heuristic, and relies on bcc not generating AVX code, so if the android ABI one day
5919459580SLuke Drummond     // provides for AVX, this function may go out of fashion.
6019459580SLuke Drummond     (void)module;
6119459580SLuke Drummond     if (!call_inst || !call_inst->getCalledFunction())
6219459580SLuke Drummond         return false;
6319459580SLuke Drummond 
6419459580SLuke Drummond     return call_inst->getCalledFunction()->getReturnType()->getPrimitiveSizeInBits() > 128;
6519459580SLuke Drummond }
6619459580SLuke Drummond 
6719459580SLuke Drummond bool
6819459580SLuke Drummond isRSAllocationPtrTy(const llvm::Type *type)
6919459580SLuke Drummond {
7019459580SLuke Drummond     if (!type->isPointerTy())
7119459580SLuke Drummond         return false;
7219459580SLuke Drummond     auto ptr_type = type->getPointerElementType();
7319459580SLuke Drummond 
7419459580SLuke Drummond     return ptr_type->isStructTy() && ptr_type->getStructName().startswith("struct.rs_allocation");
7519459580SLuke Drummond }
7619459580SLuke Drummond 
7719459580SLuke Drummond bool
7819459580SLuke Drummond isRSAllocationTyCallSite(llvm::Module &module, llvm::CallInst *call_inst)
7919459580SLuke Drummond {
8019459580SLuke Drummond     (void)module;
8119459580SLuke Drummond     if (!call_inst->hasByValArgument())
8219459580SLuke Drummond         return false;
8319459580SLuke Drummond     for (const auto &param : call_inst->operand_values())
8419459580SLuke Drummond         if (isRSAllocationPtrTy(param->getType()))
8519459580SLuke Drummond             return true;
8619459580SLuke Drummond     return false;
8719459580SLuke Drummond }
8819459580SLuke Drummond 
8919459580SLuke Drummond llvm::FunctionType *
9019459580SLuke Drummond cloneToStructRetFnTy(llvm::CallInst *call_inst)
9119459580SLuke Drummond {
9219459580SLuke Drummond     // on x86 StructReturn functions return a pointer to the return value, rather than the return
9319459580SLuke Drummond     // value itself [ref](http://www.agner.org/optimize/calling_conventions.pdf section 6).
9419459580SLuke Drummond     // We create a return type by getting the pointer type of the old return type, and inserting a new
9519459580SLuke Drummond     // initial argument of pointer type of the original return type.
9619459580SLuke Drummond     Log *log(GetLogIfAnyCategoriesSet(LIBLLDB_LOG_LANGUAGE | LIBLLDB_LOG_EXPRESSIONS));
9719459580SLuke Drummond 
9819459580SLuke Drummond     assert(call_inst && "no CallInst");
9919459580SLuke Drummond     llvm::Function *orig = call_inst->getCalledFunction();
10019459580SLuke Drummond     assert(orig && "CallInst has no called function");
10119459580SLuke Drummond     llvm::FunctionType *orig_type = orig->getFunctionType();
10219459580SLuke Drummond     auto name = orig->getName();
10319459580SLuke Drummond     if (log)
10419459580SLuke Drummond         log->Printf("%s - cloning to StructRet function for '%s'", __FUNCTION__, name.str().c_str());
10519459580SLuke Drummond 
10619459580SLuke Drummond     unsigned num_params = orig_type->getNumParams();
107*9d83de42SLuke Drummond     std::vector<llvm::Type *> new_params{num_params + 1, nullptr};
10819459580SLuke Drummond     std::vector<llvm::Type *> params{orig_type->param_begin(), orig_type->param_end()};
10919459580SLuke Drummond 
11019459580SLuke Drummond     // This may not work if the function is somehow declared void as llvm is strongly typed
11119459580SLuke Drummond     // and represents void* with i8*
11219459580SLuke Drummond     assert(!orig_type->getReturnType()->isVoidTy() && "Cannot add StructRet attribute to void function");
11319459580SLuke Drummond     llvm::PointerType *return_type_ptr_type = llvm::PointerType::getUnqual(orig->getReturnType());
11419459580SLuke Drummond     assert(return_type_ptr_type && "failed to get function return type PointerType");
11519459580SLuke Drummond     if (!return_type_ptr_type)
11619459580SLuke Drummond         return nullptr;
11719459580SLuke Drummond 
11819459580SLuke Drummond     if (log)
11919459580SLuke Drummond         log->Printf("%s - return type pointer type for StructRet clone @ '0x%p':\n", __FUNCTION__,
12019459580SLuke Drummond                     (void *)return_type_ptr_type);
12119459580SLuke Drummond     // put the the sret pointer argument in place at the beginning of the argument list.
12219459580SLuke Drummond     params.emplace(params.begin(), return_type_ptr_type);
12319459580SLuke Drummond     assert(params.size() == num_params + 1);
12419459580SLuke Drummond     return llvm::FunctionType::get(return_type_ptr_type, params, orig->isVarArg());
12519459580SLuke Drummond }
12619459580SLuke Drummond 
12719459580SLuke Drummond bool
12819459580SLuke Drummond findRSCallSites(llvm::Module &module, std::set<llvm::CallInst *> &rs_callsites,
12919459580SLuke Drummond                 bool (*predicate)(llvm::Module &, llvm::CallInst *))
13019459580SLuke Drummond {
13119459580SLuke Drummond     bool found = false;
13219459580SLuke Drummond 
13319459580SLuke Drummond     for (auto &func : module.getFunctionList())
13419459580SLuke Drummond         for (auto &block : func.getBasicBlockList())
13519459580SLuke Drummond             for (auto &inst : block)
13619459580SLuke Drummond             {
13719459580SLuke Drummond                 llvm::CallInst *call_inst = llvm::dyn_cast_or_null<llvm::CallInst>(&inst);
13819459580SLuke Drummond                 if (!call_inst || !call_inst->getCalledFunction())
13919459580SLuke Drummond                     // This is not the call-site you are looking for...
14019459580SLuke Drummond                     continue;
14119459580SLuke Drummond                 if (isRSAPICall(module, call_inst) && predicate(module, call_inst))
14219459580SLuke Drummond                 {
14319459580SLuke Drummond                     rs_callsites.insert(call_inst);
14419459580SLuke Drummond                     found = true;
14519459580SLuke Drummond                 }
14619459580SLuke Drummond             }
14719459580SLuke Drummond     return found;
14819459580SLuke Drummond }
14919459580SLuke Drummond 
15019459580SLuke Drummond bool
15119459580SLuke Drummond fixupX86StructRetCalls(llvm::Module &module)
15219459580SLuke Drummond {
15319459580SLuke Drummond     bool changed = false;
15419459580SLuke Drummond     // changing a basic block while iterating over it seems to have some undefined behaviour
15519459580SLuke Drummond     // going on so we find all RS callsites first, then fix them up after consuming
15619459580SLuke Drummond     // the iterator.
15719459580SLuke Drummond     std::set<llvm::CallInst *> rs_callsites;
15819459580SLuke Drummond     if (!findRSCallSites(module, rs_callsites, isRSLargeReturnCall))
15919459580SLuke Drummond         return false;
16019459580SLuke Drummond 
16119459580SLuke Drummond     for (auto call_inst : rs_callsites)
16219459580SLuke Drummond     {
16319459580SLuke Drummond         llvm::FunctionType *new_func_type = cloneToStructRetFnTy(call_inst);
16419459580SLuke Drummond         assert(new_func_type && "failed to clone functionType for Renderscript ABI fixup");
16519459580SLuke Drummond 
16619459580SLuke Drummond         llvm::CallSite call_site(call_inst);
16719459580SLuke Drummond         llvm::Function *func = call_inst->getCalledFunction();
16819459580SLuke Drummond         assert(func && "cannot resolve function in RenderScriptRuntime");
16919459580SLuke Drummond         // Copy the original call arguments
17019459580SLuke Drummond         std::vector<llvm::Value *> new_call_args(call_site.arg_begin(), call_site.arg_end());
17119459580SLuke Drummond 
17219459580SLuke Drummond         // Allocate enough space to store the return value of the original function
17319459580SLuke Drummond         // we pass a pointer to this allocation as the StructRet param, and then copy its
17419459580SLuke Drummond         // value into the lldb return value
17519459580SLuke Drummond         llvm::AllocaInst *return_value_alloc =
17619459580SLuke Drummond             new llvm::AllocaInst(func->getReturnType(), "var_vector_return_alloc", call_inst);
17719459580SLuke Drummond         // use the new allocation as the new first argument
17819459580SLuke Drummond         new_call_args.emplace(new_call_args.begin(), llvm::cast<llvm::Value>(return_value_alloc));
17919459580SLuke Drummond         llvm::PointerType *new_func_ptr_type = llvm::PointerType::get(new_func_type, 0);
18019459580SLuke Drummond         // Create the type cast from the old function type to the new one
18119459580SLuke Drummond         llvm::Constant *new_func_cast =
18219459580SLuke Drummond             llvm::ConstantExpr::getCast(llvm::Instruction::BitCast, func, new_func_ptr_type);
18319459580SLuke Drummond         // create an allocation for a new function pointer
18419459580SLuke Drummond         llvm::AllocaInst *new_func_ptr = new llvm::AllocaInst(new_func_ptr_type, "new_func_ptr", call_inst);
18519459580SLuke Drummond         // store the new_func_cast to the newly allocated space
18619459580SLuke Drummond         (void)new llvm::StoreInst(new_func_cast, new_func_ptr, "new_func_ptr_load_cast", call_inst);
18719459580SLuke Drummond         // load the new function address ready for a jump
18819459580SLuke Drummond         llvm::LoadInst *new_func_addr_load = new llvm::LoadInst(new_func_ptr, "load_func_pointer", call_inst);
18919459580SLuke Drummond         // and create a callinstruction from it
19019459580SLuke Drummond         llvm::CallInst *new_call_inst =
19119459580SLuke Drummond             llvm::CallInst::Create(new_func_addr_load, new_call_args, "new_func_call", call_inst);
19219459580SLuke Drummond         new_call_inst->setCallingConv(call_inst->getCallingConv());
19319459580SLuke Drummond         new_call_inst->setTailCall(call_inst->isTailCall());
19419459580SLuke Drummond         llvm::LoadInst *lldb_save_result_address = new llvm::LoadInst(return_value_alloc, "save_return_val", call_inst);
19519459580SLuke Drummond 
19619459580SLuke Drummond         // Now remove the old broken call
19719459580SLuke Drummond         call_inst->replaceAllUsesWith(lldb_save_result_address);
19819459580SLuke Drummond         call_inst->eraseFromParent();
19919459580SLuke Drummond         changed = true;
20019459580SLuke Drummond     }
20119459580SLuke Drummond     return changed;
20219459580SLuke Drummond }
20319459580SLuke Drummond 
20419459580SLuke Drummond bool
20519459580SLuke Drummond fixupRSAllocationStructByValCalls(llvm::Module &module)
20619459580SLuke Drummond {
20719459580SLuke Drummond     // On x86_64, calls to functions in the RS runtime that take an `rs_allocation` type argument
20819459580SLuke Drummond     // are actually handled as by-ref params by bcc, but appear to be passed by value by lldb (the callsite all use
20919459580SLuke Drummond     // `struct byval`).
21019459580SLuke Drummond     // On x86_64 Linux, struct arguments are transferred in registers if the struct size is no bigger than
21119459580SLuke Drummond     // 128bits [ref](http://www.agner.org/optimize/calling_conventions.pdf) section 7.1 "Passing and returning objects"
21219459580SLuke Drummond     // otherwise passed on the stack.
21319459580SLuke Drummond     // an object of type `rs_allocation` is actually 256bits, so should be passed on the stack. However, code generated
21419459580SLuke Drummond     // by bcc actually treats formal params of type `rs_allocation` as `rs_allocation *` so we need to convert the
21519459580SLuke Drummond     // calling convention to pass by reference, and remove any hint of byval from formal parameters.
21619459580SLuke Drummond     bool changed = false;
21719459580SLuke Drummond     std::set<llvm::CallInst *> rs_callsites;
21819459580SLuke Drummond     if (!findRSCallSites(module, rs_callsites, isRSAllocationTyCallSite))
21919459580SLuke Drummond         return false;
22019459580SLuke Drummond 
22119459580SLuke Drummond     std::set<llvm::Function *> rs_functions;
22219459580SLuke Drummond 
22319459580SLuke Drummond     // for all call instructions
22419459580SLuke Drummond     for (auto call_inst : rs_callsites)
22519459580SLuke Drummond     {
22619459580SLuke Drummond         // add the called function to a set so that we can strip its byval attributes in another pass
22719459580SLuke Drummond         rs_functions.insert(call_inst->getCalledFunction());
22819459580SLuke Drummond 
22919459580SLuke Drummond         // get the function attributes
23019459580SLuke Drummond         llvm::AttributeSet call_attribs = call_inst->getAttributes();
23119459580SLuke Drummond 
23219459580SLuke Drummond         // iterate over the argument attributes
23319459580SLuke Drummond         for (size_t i = 1; i <= call_attribs.getNumSlots(); ++i)
23419459580SLuke Drummond         {
23519459580SLuke Drummond             // if this argument is passed by val
23619459580SLuke Drummond             if (call_attribs.hasAttribute(i, llvm::Attribute::ByVal))
23719459580SLuke Drummond             {
23819459580SLuke Drummond                 // strip away the byval attribute
23919459580SLuke Drummond                 call_inst->removeAttribute(i, llvm::Attribute::get(module.getContext(), llvm::Attribute::ByVal));
24019459580SLuke Drummond                 changed = true;
24119459580SLuke Drummond             }
24219459580SLuke Drummond         }
24319459580SLuke Drummond     }
24419459580SLuke Drummond 
24519459580SLuke Drummond     llvm::AttributeSet attr_byval = llvm::AttributeSet::get(module.getContext(), 1u, llvm::Attribute::ByVal);
24619459580SLuke Drummond 
24719459580SLuke Drummond     // for all called function decls
24819459580SLuke Drummond     for (auto func : rs_functions)
24919459580SLuke Drummond     {
25019459580SLuke Drummond         // inspect all of the arguments in the call
25119459580SLuke Drummond         llvm::SymbolTableList<llvm::Argument> &argList = func->getArgumentList();
25219459580SLuke Drummond         for (auto &arg : argList)
25319459580SLuke Drummond         {
25419459580SLuke Drummond             if (arg.hasByValAttr())
25519459580SLuke Drummond             {
25619459580SLuke Drummond                 arg.removeAttr(attr_byval);
25719459580SLuke Drummond                 changed = true;
25819459580SLuke Drummond             }
25919459580SLuke Drummond         }
26019459580SLuke Drummond     }
26119459580SLuke Drummond     return changed;
26219459580SLuke Drummond }
26319459580SLuke Drummond } // end anonymous namespace
26419459580SLuke Drummond 
26519459580SLuke Drummond namespace lldb_private
26619459580SLuke Drummond {
26719459580SLuke Drummond namespace lldb_renderscript
26819459580SLuke Drummond {
26919459580SLuke Drummond 
27019459580SLuke Drummond bool
27119459580SLuke Drummond fixupX86FunctionCalls(llvm::Module &module)
27219459580SLuke Drummond {
27319459580SLuke Drummond     return fixupX86StructRetCalls(module);
27419459580SLuke Drummond }
27519459580SLuke Drummond 
27619459580SLuke Drummond bool
27719459580SLuke Drummond fixupX86_64FunctionCalls(llvm::Module &module)
27819459580SLuke Drummond {
27919459580SLuke Drummond     bool changed = false;
28019459580SLuke Drummond     changed |= fixupX86StructRetCalls(module);
28119459580SLuke Drummond     changed |= fixupRSAllocationStructByValCalls(module);
28219459580SLuke Drummond     return changed;
28319459580SLuke Drummond }
28419459580SLuke Drummond 
28519459580SLuke Drummond } // end namespace lldb_renderscript
28619459580SLuke Drummond } // end namespace lldb_private
287