1 //===-- IRDynamicChecks.cpp -------------------------------------*- C++ -*-===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9
10 #include "llvm/IR/Constants.h"
11 #include "llvm/IR/DataLayout.h"
12 #include "llvm/IR/Function.h"
13 #include "llvm/IR/Instructions.h"
14 #include "llvm/IR/Module.h"
15 #include "llvm/IR/Value.h"
16 #include "llvm/Support/raw_ostream.h"
17
18 #include "lldb/Expression/IRDynamicChecks.h"
19
20 #include "lldb/Expression/UtilityFunction.h"
21 #include "lldb/Target/ExecutionContext.h"
22 #include "lldb/Target/ObjCLanguageRuntime.h"
23 #include "lldb/Target/Process.h"
24 #include "lldb/Target/StackFrame.h"
25 #include "lldb/Target/Target.h"
26 #include "lldb/Utility/ConstString.h"
27 #include "lldb/Utility/Log.h"
28
29 using namespace llvm;
30 using namespace lldb_private;
31
// Pass identifier object; it is handed to the ModulePass base-class
// constructor by IRDynamicChecks.
static char ID = 0;

// Names under which the two checker utility functions are created.
#define VALID_POINTER_CHECK_NAME "_$__lldb_valid_pointer_check"
#define VALID_OBJC_OBJECT_CHECK_NAME "$__lldb_objc_object_check"

// Source text of the pointer-validity checker: a C function that simply
// reads one byte through its argument.  The function name is spliced in from
// VALID_POINTER_CHECK_NAME so the definition and the name used to create the
// utility function cannot drift apart.
static const char g_valid_pointer_check_text[] =
    "extern \"C\" void\n" VALID_POINTER_CHECK_NAME
    " (unsigned char *$__lldb_arg_ptr)\n"
    "{\n"
    " unsigned char $__lldb_local_val = *$__lldb_arg_ptr;\n"
    "}";
43
// Defaulted constructor: no checker is created here; the checker members are
// populated later by Install().
DynamicCheckerFunctions::DynamicCheckerFunctions() = default;

// Defaulted destructor: cleanup is left to the members' own destructors.
DynamicCheckerFunctions::~DynamicCheckerFunctions() = default;
47
Install(DiagnosticManager & diagnostic_manager,ExecutionContext & exe_ctx)48 bool DynamicCheckerFunctions::Install(DiagnosticManager &diagnostic_manager,
49 ExecutionContext &exe_ctx) {
50 Status error;
51 m_valid_pointer_check.reset(
52 exe_ctx.GetTargetRef().GetUtilityFunctionForLanguage(
53 g_valid_pointer_check_text, lldb::eLanguageTypeC,
54 VALID_POINTER_CHECK_NAME, error));
55 if (error.Fail())
56 return false;
57
58 if (!m_valid_pointer_check->Install(diagnostic_manager, exe_ctx))
59 return false;
60
61 Process *process = exe_ctx.GetProcessPtr();
62
63 if (process) {
64 ObjCLanguageRuntime *objc_language_runtime =
65 process->GetObjCLanguageRuntime();
66
67 if (objc_language_runtime) {
68 m_objc_object_check.reset(objc_language_runtime->CreateObjectChecker(
69 VALID_OBJC_OBJECT_CHECK_NAME));
70
71 if (!m_objc_object_check->Install(diagnostic_manager, exe_ctx))
72 return false;
73 }
74 }
75
76 return true;
77 }
78
DoCheckersExplainStop(lldb::addr_t addr,Stream & message)79 bool DynamicCheckerFunctions::DoCheckersExplainStop(lldb::addr_t addr,
80 Stream &message) {
81 // FIXME: We have to get the checkers to know why they scotched the call in
82 // more detail,
83 // so we can print a better message here.
84 if (m_valid_pointer_check && m_valid_pointer_check->ContainsAddress(addr)) {
85 message.Printf("Attempted to dereference an invalid pointer.");
86 return true;
87 } else if (m_objc_object_check &&
88 m_objc_object_check->ContainsAddress(addr)) {
89 message.Printf("Attempted to dereference an invalid ObjC Object or send it "
90 "an unrecognized selector");
91 return true;
92 }
93 return false;
94 }
95
PrintValue(llvm::Value * V,bool truncate=false)96 static std::string PrintValue(llvm::Value *V, bool truncate = false) {
97 std::string s;
98 raw_string_ostream rso(s);
99 V->print(rso);
100 rso.flush();
101 if (truncate)
102 s.resize(s.length() - 1);
103 return s;
104 }
105
106 //----------------------------------------------------------------------
107 /// @class Instrumenter IRDynamicChecks.cpp
108 /// Finds and instruments individual LLVM IR instructions
109 ///
110 /// When instrumenting LLVM IR, it is frequently desirable to first search for
111 /// instructions, and then later modify them. This way iterators remain
112 /// intact, and multiple passes can look at the same code base without
113 /// treading on each other's toes.
114 ///
115 /// The Instrumenter class implements this functionality. A client first
116 /// calls Inspect on a function, which populates a list of instructions to be
117 /// instrumented. Then, later, when all passes' Inspect functions have been
118 /// called, the client calls Instrument, which adds the desired
119 /// instrumentation.
120 ///
121 /// A subclass of Instrumenter must override InstrumentInstruction, which
122 /// is responsible for adding whatever instrumentation is necessary.
123 ///
124 /// A subclass of Instrumenter may override:
125 ///
126 /// - InspectInstruction [default: does nothing]
127 ///
128 /// - InspectBasicBlock [default: iterates through the instructions in a
129 /// basic block calling InspectInstruction]
130 ///
131 /// - InspectFunction [default: iterates through the basic blocks in a
132 /// function calling InspectBasicBlock]
133 //----------------------------------------------------------------------
134 class Instrumenter {
135 public:
136 //------------------------------------------------------------------
137 /// Constructor
138 ///
139 /// @param[in] module
140 /// The module being instrumented.
141 //------------------------------------------------------------------
Instrumenter(llvm::Module & module,DynamicCheckerFunctions & checker_functions)142 Instrumenter(llvm::Module &module, DynamicCheckerFunctions &checker_functions)
143 : m_module(module), m_checker_functions(checker_functions),
144 m_i8ptr_ty(nullptr), m_intptr_ty(nullptr) {}
145
146 virtual ~Instrumenter() = default;
147
148 //------------------------------------------------------------------
149 /// Inspect a function to find instructions to instrument
150 ///
151 /// @param[in] function
152 /// The function to inspect.
153 ///
154 /// @return
155 /// True on success; false on error.
156 //------------------------------------------------------------------
Inspect(llvm::Function & function)157 bool Inspect(llvm::Function &function) { return InspectFunction(function); }
158
159 //------------------------------------------------------------------
160 /// Instrument all the instructions found by Inspect()
161 ///
162 /// @return
163 /// True on success; false on error.
164 //------------------------------------------------------------------
Instrument()165 bool Instrument() {
166 for (InstIterator ii = m_to_instrument.begin(),
167 last_ii = m_to_instrument.end();
168 ii != last_ii; ++ii) {
169 if (!InstrumentInstruction(*ii))
170 return false;
171 }
172
173 return true;
174 }
175
176 protected:
177 //------------------------------------------------------------------
178 /// Add instrumentation to a single instruction
179 ///
180 /// @param[in] inst
181 /// The instruction to be instrumented.
182 ///
183 /// @return
184 /// True on success; false otherwise.
185 //------------------------------------------------------------------
186 virtual bool InstrumentInstruction(llvm::Instruction *inst) = 0;
187
188 //------------------------------------------------------------------
189 /// Register a single instruction to be instrumented
190 ///
191 /// @param[in] inst
192 /// The instruction to be instrumented.
193 //------------------------------------------------------------------
RegisterInstruction(llvm::Instruction & i)194 void RegisterInstruction(llvm::Instruction &i) {
195 m_to_instrument.push_back(&i);
196 }
197
198 //------------------------------------------------------------------
199 /// Determine whether a single instruction is interesting to instrument,
200 /// and, if so, call RegisterInstruction
201 ///
202 /// @param[in] i
203 /// The instruction to be inspected.
204 ///
205 /// @return
206 /// False if there was an error scanning; true otherwise.
207 //------------------------------------------------------------------
InspectInstruction(llvm::Instruction & i)208 virtual bool InspectInstruction(llvm::Instruction &i) { return true; }
209
210 //------------------------------------------------------------------
211 /// Scan a basic block to see if any instructions are interesting
212 ///
213 /// @param[in] bb
214 /// The basic block to be inspected.
215 ///
216 /// @return
217 /// False if there was an error scanning; true otherwise.
218 //------------------------------------------------------------------
InspectBasicBlock(llvm::BasicBlock & bb)219 virtual bool InspectBasicBlock(llvm::BasicBlock &bb) {
220 for (llvm::BasicBlock::iterator ii = bb.begin(), last_ii = bb.end();
221 ii != last_ii; ++ii) {
222 if (!InspectInstruction(*ii))
223 return false;
224 }
225
226 return true;
227 }
228
229 //------------------------------------------------------------------
230 /// Scan a function to see if any instructions are interesting
231 ///
232 /// @param[in] f
233 /// The function to be inspected.
234 ///
235 /// @return
236 /// False if there was an error scanning; true otherwise.
237 //------------------------------------------------------------------
InspectFunction(llvm::Function & f)238 virtual bool InspectFunction(llvm::Function &f) {
239 for (llvm::Function::iterator bbi = f.begin(), last_bbi = f.end();
240 bbi != last_bbi; ++bbi) {
241 if (!InspectBasicBlock(*bbi))
242 return false;
243 }
244
245 return true;
246 }
247
248 //------------------------------------------------------------------
249 /// Build a function pointer for a function with signature void
250 /// (*)(uint8_t*) with a given address
251 ///
252 /// @param[in] start_address
253 /// The address of the function.
254 ///
255 /// @return
256 /// The function pointer, for use in a CallInst.
257 //------------------------------------------------------------------
BuildPointerValidatorFunc(lldb::addr_t start_address)258 llvm::Value *BuildPointerValidatorFunc(lldb::addr_t start_address) {
259 llvm::Type *param_array[1];
260
261 param_array[0] = const_cast<llvm::PointerType *>(GetI8PtrTy());
262
263 ArrayRef<llvm::Type *> params(param_array, 1);
264
265 FunctionType *fun_ty = FunctionType::get(
266 llvm::Type::getVoidTy(m_module.getContext()), params, true);
267 PointerType *fun_ptr_ty = PointerType::getUnqual(fun_ty);
268 Constant *fun_addr_int =
269 ConstantInt::get(GetIntptrTy(), start_address, false);
270 return ConstantExpr::getIntToPtr(fun_addr_int, fun_ptr_ty);
271 }
272
273 //------------------------------------------------------------------
274 /// Build a function pointer for a function with signature void
275 /// (*)(uint8_t*, uint8_t*) with a given address
276 ///
277 /// @param[in] start_address
278 /// The address of the function.
279 ///
280 /// @return
281 /// The function pointer, for use in a CallInst.
282 //------------------------------------------------------------------
BuildObjectCheckerFunc(lldb::addr_t start_address)283 llvm::Value *BuildObjectCheckerFunc(lldb::addr_t start_address) {
284 llvm::Type *param_array[2];
285
286 param_array[0] = const_cast<llvm::PointerType *>(GetI8PtrTy());
287 param_array[1] = const_cast<llvm::PointerType *>(GetI8PtrTy());
288
289 ArrayRef<llvm::Type *> params(param_array, 2);
290
291 FunctionType *fun_ty = FunctionType::get(
292 llvm::Type::getVoidTy(m_module.getContext()), params, true);
293 PointerType *fun_ptr_ty = PointerType::getUnqual(fun_ty);
294 Constant *fun_addr_int =
295 ConstantInt::get(GetIntptrTy(), start_address, false);
296 return ConstantExpr::getIntToPtr(fun_addr_int, fun_ptr_ty);
297 }
298
GetI8PtrTy()299 PointerType *GetI8PtrTy() {
300 if (!m_i8ptr_ty)
301 m_i8ptr_ty = llvm::Type::getInt8PtrTy(m_module.getContext());
302
303 return m_i8ptr_ty;
304 }
305
GetIntptrTy()306 IntegerType *GetIntptrTy() {
307 if (!m_intptr_ty) {
308 llvm::DataLayout data_layout(&m_module);
309
310 m_intptr_ty = llvm::Type::getIntNTy(m_module.getContext(),
311 data_layout.getPointerSizeInBits());
312 }
313
314 return m_intptr_ty;
315 }
316
317 typedef std::vector<llvm::Instruction *> InstVector;
318 typedef InstVector::iterator InstIterator;
319
320 InstVector m_to_instrument; ///< List of instructions the inspector found
321 llvm::Module &m_module; ///< The module which is being instrumented
322 DynamicCheckerFunctions
323 &m_checker_functions; ///< The dynamic checker functions for the process
324
325 private:
326 PointerType *m_i8ptr_ty;
327 IntegerType *m_intptr_ty;
328 };
329
330 class ValidPointerChecker : public Instrumenter {
331 public:
ValidPointerChecker(llvm::Module & module,DynamicCheckerFunctions & checker_functions)332 ValidPointerChecker(llvm::Module &module,
333 DynamicCheckerFunctions &checker_functions)
334 : Instrumenter(module, checker_functions),
335 m_valid_pointer_check_func(nullptr) {}
336
337 ~ValidPointerChecker() override = default;
338
339 protected:
InstrumentInstruction(llvm::Instruction * inst)340 bool InstrumentInstruction(llvm::Instruction *inst) override {
341 Log *log(lldb_private::GetLogIfAllCategoriesSet(LIBLLDB_LOG_EXPRESSIONS));
342
343 if (log)
344 log->Printf("Instrumenting load/store instruction: %s\n",
345 PrintValue(inst).c_str());
346
347 if (!m_valid_pointer_check_func)
348 m_valid_pointer_check_func = BuildPointerValidatorFunc(
349 m_checker_functions.m_valid_pointer_check->StartAddress());
350
351 llvm::Value *dereferenced_ptr = nullptr;
352
353 if (llvm::LoadInst *li = dyn_cast<llvm::LoadInst>(inst))
354 dereferenced_ptr = li->getPointerOperand();
355 else if (llvm::StoreInst *si = dyn_cast<llvm::StoreInst>(inst))
356 dereferenced_ptr = si->getPointerOperand();
357 else
358 return false;
359
360 // Insert an instruction to cast the loaded value to int8_t*
361
362 BitCastInst *bit_cast =
363 new BitCastInst(dereferenced_ptr, GetI8PtrTy(), "", inst);
364
365 // Insert an instruction to call the helper with the result
366
367 llvm::Value *arg_array[1];
368
369 arg_array[0] = bit_cast;
370
371 llvm::ArrayRef<llvm::Value *> args(arg_array, 1);
372
373 CallInst::Create(m_valid_pointer_check_func, args, "", inst);
374
375 return true;
376 }
377
InspectInstruction(llvm::Instruction & i)378 bool InspectInstruction(llvm::Instruction &i) override {
379 if (dyn_cast<llvm::LoadInst>(&i) || dyn_cast<llvm::StoreInst>(&i))
380 RegisterInstruction(i);
381
382 return true;
383 }
384
385 private:
386 llvm::Value *m_valid_pointer_check_func;
387 };
388
389 class ObjcObjectChecker : public Instrumenter {
390 public:
ObjcObjectChecker(llvm::Module & module,DynamicCheckerFunctions & checker_functions)391 ObjcObjectChecker(llvm::Module &module,
392 DynamicCheckerFunctions &checker_functions)
393 : Instrumenter(module, checker_functions),
394 m_objc_object_check_func(nullptr) {}
395
396 ~ObjcObjectChecker() override = default;
397
398 enum msgSend_type {
399 eMsgSend = 0,
400 eMsgSendSuper,
401 eMsgSendSuper_stret,
402 eMsgSend_fpret,
403 eMsgSend_stret
404 };
405
406 std::map<llvm::Instruction *, msgSend_type> msgSend_types;
407
408 protected:
InstrumentInstruction(llvm::Instruction * inst)409 bool InstrumentInstruction(llvm::Instruction *inst) override {
410 CallInst *call_inst = dyn_cast<CallInst>(inst);
411
412 if (!call_inst)
413 return false; // call_inst really shouldn't be nullptr, because otherwise
414 // InspectInstruction wouldn't have registered it
415
416 if (!m_objc_object_check_func)
417 m_objc_object_check_func = BuildObjectCheckerFunc(
418 m_checker_functions.m_objc_object_check->StartAddress());
419
420 // id objc_msgSend(id theReceiver, SEL theSelector, ...)
421
422 llvm::Value *target_object;
423 llvm::Value *selector;
424
425 switch (msgSend_types[inst]) {
426 case eMsgSend:
427 case eMsgSend_fpret:
428 target_object = call_inst->getArgOperand(0);
429 selector = call_inst->getArgOperand(1);
430 break;
431 case eMsgSend_stret:
432 target_object = call_inst->getArgOperand(1);
433 selector = call_inst->getArgOperand(2);
434 break;
435 case eMsgSendSuper:
436 case eMsgSendSuper_stret:
437 return true;
438 }
439
440 // These objects should always be valid according to Sean Calannan
441 assert(target_object);
442 assert(selector);
443
444 // Insert an instruction to cast the receiver id to int8_t*
445
446 BitCastInst *bit_cast =
447 new BitCastInst(target_object, GetI8PtrTy(), "", inst);
448
449 // Insert an instruction to call the helper with the result
450
451 llvm::Value *arg_array[2];
452
453 arg_array[0] = bit_cast;
454 arg_array[1] = selector;
455
456 ArrayRef<llvm::Value *> args(arg_array, 2);
457
458 CallInst::Create(m_objc_object_check_func, args, "", inst);
459
460 return true;
461 }
462
GetFunction(llvm::Value * value)463 static llvm::Function *GetFunction(llvm::Value *value) {
464 if (llvm::Function *function = llvm::dyn_cast<llvm::Function>(value)) {
465 return function;
466 }
467
468 if (llvm::ConstantExpr *const_expr =
469 llvm::dyn_cast<llvm::ConstantExpr>(value)) {
470 switch (const_expr->getOpcode()) {
471 default:
472 return nullptr;
473 case llvm::Instruction::BitCast:
474 return GetFunction(const_expr->getOperand(0));
475 }
476 }
477
478 return nullptr;
479 }
480
GetCalledFunction(llvm::CallInst * inst)481 static llvm::Function *GetCalledFunction(llvm::CallInst *inst) {
482 return GetFunction(inst->getCalledValue());
483 }
484
InspectInstruction(llvm::Instruction & i)485 bool InspectInstruction(llvm::Instruction &i) override {
486 Log *log(lldb_private::GetLogIfAllCategoriesSet(LIBLLDB_LOG_EXPRESSIONS));
487
488 CallInst *call_inst = dyn_cast<CallInst>(&i);
489
490 if (call_inst) {
491 const llvm::Function *called_function = GetCalledFunction(call_inst);
492
493 if (!called_function)
494 return true;
495
496 std::string name_str = called_function->getName().str();
497 const char *name_cstr = name_str.c_str();
498
499 if (log)
500 log->Printf("Found call to %s: %s\n", name_cstr,
501 PrintValue(call_inst).c_str());
502
503 if (name_str.find("objc_msgSend") == std::string::npos)
504 return true;
505
506 if (!strcmp(name_cstr, "objc_msgSend")) {
507 RegisterInstruction(i);
508 msgSend_types[&i] = eMsgSend;
509 return true;
510 }
511
512 if (!strcmp(name_cstr, "objc_msgSend_stret")) {
513 RegisterInstruction(i);
514 msgSend_types[&i] = eMsgSend_stret;
515 return true;
516 }
517
518 if (!strcmp(name_cstr, "objc_msgSend_fpret")) {
519 RegisterInstruction(i);
520 msgSend_types[&i] = eMsgSend_fpret;
521 return true;
522 }
523
524 if (!strcmp(name_cstr, "objc_msgSendSuper")) {
525 RegisterInstruction(i);
526 msgSend_types[&i] = eMsgSendSuper;
527 return true;
528 }
529
530 if (!strcmp(name_cstr, "objc_msgSendSuper_stret")) {
531 RegisterInstruction(i);
532 msgSend_types[&i] = eMsgSendSuper_stret;
533 return true;
534 }
535
536 if (log)
537 log->Printf(
538 "Function name '%s' contains 'objc_msgSend' but is not handled",
539 name_str.c_str());
540
541 return true;
542 }
543
544 return true;
545 }
546
547 private:
548 llvm::Value *m_objc_object_check_func;
549 };
550
IRDynamicChecks(DynamicCheckerFunctions & checker_functions,const char * func_name)551 IRDynamicChecks::IRDynamicChecks(DynamicCheckerFunctions &checker_functions,
552 const char *func_name)
553 : ModulePass(ID), m_func_name(func_name),
554 m_checker_functions(checker_functions) {}
555
556 IRDynamicChecks::~IRDynamicChecks() = default;
557
runOnModule(llvm::Module & M)558 bool IRDynamicChecks::runOnModule(llvm::Module &M) {
559 Log *log(lldb_private::GetLogIfAllCategoriesSet(LIBLLDB_LOG_EXPRESSIONS));
560
561 llvm::Function *function = M.getFunction(StringRef(m_func_name));
562
563 if (!function) {
564 if (log)
565 log->Printf("Couldn't find %s() in the module", m_func_name.c_str());
566
567 return false;
568 }
569
570 if (m_checker_functions.m_valid_pointer_check) {
571 ValidPointerChecker vpc(M, m_checker_functions);
572
573 if (!vpc.Inspect(*function))
574 return false;
575
576 if (!vpc.Instrument())
577 return false;
578 }
579
580 if (m_checker_functions.m_objc_object_check) {
581 ObjcObjectChecker ooc(M, m_checker_functions);
582
583 if (!ooc.Inspect(*function))
584 return false;
585
586 if (!ooc.Instrument())
587 return false;
588 }
589
590 if (log && log->GetVerbose()) {
591 std::string s;
592 raw_string_ostream oss(s);
593
594 M.print(oss, nullptr);
595
596 oss.flush();
597
598 log->Printf("Module after dynamic checks: \n%s", s.c_str());
599 }
600
601 return true;
602 }
603
// Deliberately empty: both arguments are ignored and nothing is done with
// the pass-manager stack.
void IRDynamicChecks::assignPassManager(PMStack &PMS, PassManagerType T) {}
605
// Always reports the module-level pass manager type.
PassManagerType IRDynamicChecks::getPotentialPassManagerType() const {
  return PMT_ModulePassManager;
}
609