1 //===-- DynamicLoaderDarwin.cpp -----------------------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "DynamicLoaderDarwin.h"
11 
12 #include "lldb/Breakpoint/StoppointCallbackContext.h"
13 #include "lldb/Core/Debugger.h"
14 #include "lldb/Core/Module.h"
15 #include "lldb/Core/ModuleSpec.h"
16 #include "lldb/Core/PluginManager.h"
17 #include "lldb/Core/Section.h"
18 #include "lldb/Expression/DiagnosticManager.h"
19 #include "lldb/Host/FileSystem.h"
20 #include "lldb/Symbol/ClangASTContext.h"
21 #include "lldb/Symbol/Function.h"
22 #include "lldb/Symbol/ObjectFile.h"
23 #include "lldb/Target/ABI.h"
24 #include "lldb/Target/ObjCLanguageRuntime.h"
25 #include "lldb/Target/RegisterContext.h"
26 #include "lldb/Target/StackFrame.h"
27 #include "lldb/Target/Target.h"
28 #include "lldb/Target/Thread.h"
29 #include "lldb/Target/ThreadPlanCallFunction.h"
30 #include "lldb/Target/ThreadPlanRunToAddress.h"
31 #include "lldb/Utility/DataBuffer.h"
32 #include "lldb/Utility/DataBufferHeap.h"
33 #include "lldb/Utility/Log.h"
34 #include "lldb/Utility/State.h"
35 
36 //#define ENABLE_DEBUG_PRINTF // COMMENT THIS LINE OUT PRIOR TO CHECKIN
37 #ifdef ENABLE_DEBUG_PRINTF
38 #include <stdio.h>
39 #define DEBUG_PRINTF(fmt, ...) printf(fmt, ##__VA_ARGS__)
40 #else
41 #define DEBUG_PRINTF(fmt, ...)
42 #endif
43 
44 #ifndef __APPLE__
45 #include "Utility/UuidCompatibility.h"
46 #else
47 #include <uuid/uuid.h>
48 #endif
49 
50 using namespace lldb;
51 using namespace lldb_private;
52 
53 //----------------------------------------------------------------------
54 // Constructor
55 //----------------------------------------------------------------------
56 DynamicLoaderDarwin::DynamicLoaderDarwin(Process *process)
57     : DynamicLoader(process), m_dyld_module_wp(), m_libpthread_module_wp(),
58       m_pthread_getspecific_addr(), m_tid_to_tls_map(), m_dyld_image_infos(),
59       m_dyld_image_infos_stop_id(UINT32_MAX), m_dyld(), m_mutex() {}
60 
61 //----------------------------------------------------------------------
62 // Destructor
63 //----------------------------------------------------------------------
64 DynamicLoaderDarwin::~DynamicLoaderDarwin() {}
65 
//------------------------------------------------------------------
/// Called after attaching to a process.
///
/// Allows this DynamicLoader plug-in to execute some code after attaching
/// to a process: the cached state is reset for m_process, then
/// DoInitialImageFetch() and SetNotificationBreakpoint() are called, in
/// that order.
//------------------------------------------------------------------
void DynamicLoaderDarwin::DidAttach() {
  // Reset cached state before fetching anything for this process.
  PrivateInitialize(m_process);
  DoInitialImageFetch();
  SetNotificationBreakpoint();
}
77 
//------------------------------------------------------------------
/// Called after launching a process.
///
/// Allows this DynamicLoader plug-in to execute some code after launching
/// a process. Performs the same steps as DidAttach(): the cached state is
/// reset for m_process, then DoInitialImageFetch() and
/// SetNotificationBreakpoint() are called, in that order.
//------------------------------------------------------------------
void DynamicLoaderDarwin::DidLaunch() {
  // Reset cached state before fetching anything for this process.
  PrivateInitialize(m_process);
  DoInitialImageFetch();
  SetNotificationBreakpoint();
}
89 
90 //----------------------------------------------------------------------
91 // Clear out the state of this class.
92 //----------------------------------------------------------------------
93 void DynamicLoaderDarwin::Clear(bool clear_process) {
94   std::lock_guard<std::recursive_mutex> guard(m_mutex);
95   if (clear_process)
96     m_process = NULL;
97   m_dyld_image_infos.clear();
98   m_dyld_image_infos_stop_id = UINT32_MAX;
99   m_dyld.Clear(false);
100 }
101 
102 ModuleSP DynamicLoaderDarwin::FindTargetModuleForImageInfo(
103     ImageInfo &image_info, bool can_create, bool *did_create_ptr) {
104   if (did_create_ptr)
105     *did_create_ptr = false;
106 
107   Target &target = m_process->GetTarget();
108   const ModuleList &target_images = target.GetImages();
109   ModuleSpec module_spec(image_info.file_spec);
110   module_spec.GetUUID() = image_info.uuid;
111   ModuleSP module_sp(target_images.FindFirstModule(module_spec));
112 
113   if (module_sp && !module_spec.GetUUID().IsValid() &&
114       !module_sp->GetUUID().IsValid()) {
115     // No UUID, we must rely upon the cached module modification time and the
116     // modification time of the file on disk
117     if (module_sp->GetModificationTime() !=
118         FileSystem::Instance().GetModificationTime(module_sp->GetFileSpec()))
119       module_sp.reset();
120   }
121 
122   if (!module_sp) {
123     if (can_create) {
124       module_sp = target.GetSharedModule(module_spec);
125       if (!module_sp || module_sp->GetObjectFile() == NULL)
126         module_sp = m_process->ReadModuleFromMemory(image_info.file_spec,
127                                                     image_info.address);
128 
129       if (did_create_ptr)
130         *did_create_ptr = (bool)module_sp;
131     }
132   }
133   return module_sp;
134 }
135 
136 void DynamicLoaderDarwin::UnloadImages(
137     const std::vector<lldb::addr_t> &solib_addresses) {
138   std::lock_guard<std::recursive_mutex> guard(m_mutex);
139   if (m_process->GetStopID() == m_dyld_image_infos_stop_id)
140     return;
141 
142   Log *log(lldb_private::GetLogIfAnyCategoriesSet(LIBLLDB_LOG_DYNAMIC_LOADER));
143   Target &target = m_process->GetTarget();
144   if (log)
145     log->Printf("Removing %" PRId64 " modules.",
146                 (uint64_t)solib_addresses.size());
147 
148   ModuleList unloaded_module_list;
149 
150   for (addr_t solib_addr : solib_addresses) {
151     Address header;
152     if (header.SetLoadAddress(solib_addr, &target)) {
153       if (header.GetOffset() == 0) {
154         ModuleSP module_to_remove(header.GetModule());
155         if (module_to_remove.get()) {
156           if (log)
157             log->Printf("Removing module at address 0x%" PRIx64, solib_addr);
158           // remove the sections from the Target
159           UnloadSections(module_to_remove);
160           // add this to the list of modules to remove
161           unloaded_module_list.AppendIfNeeded(module_to_remove);
162           // remove the entry from the m_dyld_image_infos
163           ImageInfo::collection::iterator pos, end = m_dyld_image_infos.end();
164           for (pos = m_dyld_image_infos.begin(); pos != end; pos++) {
165             if (solib_addr == (*pos).address) {
166               m_dyld_image_infos.erase(pos);
167               break;
168             }
169           }
170         }
171       }
172     }
173   }
174 
175   if (unloaded_module_list.GetSize() > 0) {
176     if (log) {
177       log->PutCString("Unloaded:");
178       unloaded_module_list.LogUUIDAndPaths(
179           log, "DynamicLoaderDarwin::UnloadModules");
180     }
181     m_process->GetTarget().GetImages().Remove(unloaded_module_list);
182     m_dyld_image_infos_stop_id = m_process->GetStopID();
183   }
184 }
185 
186 void DynamicLoaderDarwin::UnloadAllImages() {
187   Log *log(lldb_private::GetLogIfAnyCategoriesSet(LIBLLDB_LOG_DYNAMIC_LOADER));
188   ModuleList unloaded_modules_list;
189 
190   Target &target = m_process->GetTarget();
191   const ModuleList &target_modules = target.GetImages();
192   std::lock_guard<std::recursive_mutex> guard(target_modules.GetMutex());
193 
194   size_t num_modules = target_modules.GetSize();
195   ModuleSP dyld_sp(GetDYLDModule());
196 
197   for (size_t i = 0; i < num_modules; i++) {
198     ModuleSP module_sp = target_modules.GetModuleAtIndexUnlocked(i);
199 
200     // Don't remove dyld - else we'll lose our breakpoint notifying us about
201     // libraries being re-loaded...
202     if (module_sp.get() != nullptr && module_sp.get() != dyld_sp.get()) {
203       UnloadSections(module_sp);
204       unloaded_modules_list.Append(module_sp);
205     }
206   }
207 
208   if (unloaded_modules_list.GetSize() != 0) {
209     if (log) {
210       log->PutCString("Unloaded:");
211       unloaded_modules_list.LogUUIDAndPaths(
212           log, "DynamicLoaderDarwin::UnloadAllImages");
213     }
214     target.GetImages().Remove(unloaded_modules_list);
215     m_dyld_image_infos.clear();
216     m_dyld_image_infos_stop_id = m_process->GetStopID();
217   }
218 }
219 
220 //----------------------------------------------------------------------
221 // Update the load addresses for all segments in MODULE using the updated INFO
222 // that is passed in.
223 //----------------------------------------------------------------------
224 bool DynamicLoaderDarwin::UpdateImageLoadAddress(Module *module,
225                                                  ImageInfo &info) {
226   bool changed = false;
227   if (module) {
228     ObjectFile *image_object_file = module->GetObjectFile();
229     if (image_object_file) {
230       SectionList *section_list = image_object_file->GetSectionList();
231       if (section_list) {
232         std::vector<uint32_t> inaccessible_segment_indexes;
233         // We now know the slide amount, so go through all sections and update
234         // the load addresses with the correct values.
235         const size_t num_segments = info.segments.size();
236         for (size_t i = 0; i < num_segments; ++i) {
237           // Only load a segment if it has protections. Things like __PAGEZERO
238           // don't have any protections, and they shouldn't be slid
239           SectionSP section_sp(
240               section_list->FindSectionByName(info.segments[i].name));
241 
242           if (info.segments[i].maxprot == 0) {
243             inaccessible_segment_indexes.push_back(i);
244           } else {
245             const addr_t new_section_load_addr =
246                 info.segments[i].vmaddr + info.slide;
247             static ConstString g_section_name_LINKEDIT("__LINKEDIT");
248 
249             if (section_sp) {
250               // __LINKEDIT sections from files in the shared cache can overlap
251               // so check to see what the segment name is and pass "false" so
252               // we don't warn of overlapping "Section" objects, and "true" for
253               // all other sections.
254               const bool warn_multiple =
255                   section_sp->GetName() != g_section_name_LINKEDIT;
256 
257               changed = m_process->GetTarget().SetSectionLoadAddress(
258                   section_sp, new_section_load_addr, warn_multiple);
259             } else {
260               Host::SystemLog(
261                   Host::eSystemLogWarning,
262                   "warning: unable to find and load segment named '%s' at "
263                   "0x%" PRIx64 " in '%s' in macosx dynamic loader plug-in.\n",
264                   info.segments[i].name.AsCString("<invalid>"),
265                   (uint64_t)new_section_load_addr,
266                   image_object_file->GetFileSpec().GetPath().c_str());
267             }
268           }
269         }
270 
271         // If the loaded the file (it changed) and we have segments that are
272         // not readable or writeable, add them to the invalid memory region
273         // cache for the process. This will typically only be the __PAGEZERO
274         // segment in the main executable. We might be able to apply this more
275         // generally to more sections that have no protections in the future,
276         // but for now we are going to just do __PAGEZERO.
277         if (changed && !inaccessible_segment_indexes.empty()) {
278           for (uint32_t i = 0; i < inaccessible_segment_indexes.size(); ++i) {
279             const uint32_t seg_idx = inaccessible_segment_indexes[i];
280             SectionSP section_sp(
281                 section_list->FindSectionByName(info.segments[seg_idx].name));
282 
283             if (section_sp) {
284               static ConstString g_pagezero_section_name("__PAGEZERO");
285               if (g_pagezero_section_name == section_sp->GetName()) {
286                 // __PAGEZERO never slides...
287                 const lldb::addr_t vmaddr = info.segments[seg_idx].vmaddr;
288                 const lldb::addr_t vmsize = info.segments[seg_idx].vmsize;
289                 Process::LoadRange pagezero_range(vmaddr, vmsize);
290                 m_process->AddInvalidMemoryRegion(pagezero_range);
291               }
292             }
293           }
294         }
295       }
296     }
297   }
298   // We might have an in memory image that was loaded as soon as it was created
299   if (info.load_stop_id == m_process->GetStopID())
300     changed = true;
301   else if (changed) {
302     // Update the stop ID when this library was updated
303     info.load_stop_id = m_process->GetStopID();
304   }
305   return changed;
306 }
307 
308 //----------------------------------------------------------------------
309 // Unload the segments in MODULE using the INFO that is passed in.
310 //----------------------------------------------------------------------
311 bool DynamicLoaderDarwin::UnloadModuleSections(Module *module,
312                                                ImageInfo &info) {
313   bool changed = false;
314   if (module) {
315     ObjectFile *image_object_file = module->GetObjectFile();
316     if (image_object_file) {
317       SectionList *section_list = image_object_file->GetSectionList();
318       if (section_list) {
319         const size_t num_segments = info.segments.size();
320         for (size_t i = 0; i < num_segments; ++i) {
321           SectionSP section_sp(
322               section_list->FindSectionByName(info.segments[i].name));
323           if (section_sp) {
324             const addr_t old_section_load_addr =
325                 info.segments[i].vmaddr + info.slide;
326             if (m_process->GetTarget().SetSectionUnloaded(
327                     section_sp, old_section_load_addr))
328               changed = true;
329           } else {
330             Host::SystemLog(Host::eSystemLogWarning,
331                             "warning: unable to find and unload segment named "
332                             "'%s' in '%s' in macosx dynamic loader plug-in.\n",
333                             info.segments[i].name.AsCString("<invalid>"),
334                             image_object_file->GetFileSpec().GetPath().c_str());
335           }
336         }
337       }
338     }
339   }
340   return changed;
341 }
342 
343 // Given a JSON dictionary (from debugserver, most likely) of binary images
344 // loaded in the inferior process, add the images to the ImageInfo collection.
345 
346 bool DynamicLoaderDarwin::JSONImageInformationIntoImageInfo(
347     StructuredData::ObjectSP image_details,
348     ImageInfo::collection &image_infos) {
349   StructuredData::ObjectSP images_sp =
350       image_details->GetAsDictionary()->GetValueForKey("images");
351   if (images_sp.get() == nullptr)
352     return false;
353 
354   image_infos.resize(images_sp->GetAsArray()->GetSize());
355 
356   for (size_t i = 0; i < image_infos.size(); i++) {
357     StructuredData::ObjectSP image_sp =
358         images_sp->GetAsArray()->GetItemAtIndex(i);
359     if (image_sp.get() == nullptr || image_sp->GetAsDictionary() == nullptr)
360       return false;
361     StructuredData::Dictionary *image = image_sp->GetAsDictionary();
362     if (image->HasKey("load_address") == false ||
363         image->HasKey("pathname") == false ||
364         image->HasKey("mod_date") == false ||
365         image->HasKey("mach_header") == false ||
366         image->GetValueForKey("mach_header")->GetAsDictionary() == nullptr ||
367         image->HasKey("segments") == false ||
368         image->GetValueForKey("segments")->GetAsArray() == nullptr ||
369         image->HasKey("uuid") == false) {
370       return false;
371     }
372     image_infos[i].address =
373         image->GetValueForKey("load_address")->GetAsInteger()->GetValue();
374     image_infos[i].mod_date =
375         image->GetValueForKey("mod_date")->GetAsInteger()->GetValue();
376     image_infos[i].file_spec.SetFile(
377         image->GetValueForKey("pathname")->GetAsString()->GetValue(),
378         FileSpec::Style::native);
379 
380     StructuredData::Dictionary *mh =
381         image->GetValueForKey("mach_header")->GetAsDictionary();
382     image_infos[i].header.magic =
383         mh->GetValueForKey("magic")->GetAsInteger()->GetValue();
384     image_infos[i].header.cputype =
385         mh->GetValueForKey("cputype")->GetAsInteger()->GetValue();
386     image_infos[i].header.cpusubtype =
387         mh->GetValueForKey("cpusubtype")->GetAsInteger()->GetValue();
388     image_infos[i].header.filetype =
389         mh->GetValueForKey("filetype")->GetAsInteger()->GetValue();
390 
391     if (image->HasKey("min_version_os_name")) {
392       std::string os_name = image->GetValueForKey("min_version_os_name")
393                                 ->GetAsString()
394                                 ->GetValue();
395       if (os_name == "macosx")
396         image_infos[i].os_type = llvm::Triple::MacOSX;
397       else if (os_name == "ios" || os_name == "iphoneos")
398         image_infos[i].os_type = llvm::Triple::IOS;
399       else if (os_name == "tvos")
400         image_infos[i].os_type = llvm::Triple::TvOS;
401       else if (os_name == "watchos")
402         image_infos[i].os_type = llvm::Triple::WatchOS;
403       // NEED_BRIDGEOS_TRIPLE else if (os_name == "bridgeos")
404       // NEED_BRIDGEOS_TRIPLE   image_infos[i].os_type = llvm::Triple::BridgeOS;
405     }
406     if (image->HasKey("min_version_os_sdk")) {
407       image_infos[i].min_version_os_sdk =
408           image->GetValueForKey("min_version_os_sdk")
409               ->GetAsString()
410               ->GetValue();
411     }
412 
413     // Fields that aren't used by DynamicLoaderDarwin so debugserver doesn't
414     // currently send them in the reply.
415 
416     if (mh->HasKey("flags"))
417       image_infos[i].header.flags =
418           mh->GetValueForKey("flags")->GetAsInteger()->GetValue();
419     else
420       image_infos[i].header.flags = 0;
421 
422     if (mh->HasKey("ncmds"))
423       image_infos[i].header.ncmds =
424           mh->GetValueForKey("ncmds")->GetAsInteger()->GetValue();
425     else
426       image_infos[i].header.ncmds = 0;
427 
428     if (mh->HasKey("sizeofcmds"))
429       image_infos[i].header.sizeofcmds =
430           mh->GetValueForKey("sizeofcmds")->GetAsInteger()->GetValue();
431     else
432       image_infos[i].header.sizeofcmds = 0;
433 
434     StructuredData::Array *segments =
435         image->GetValueForKey("segments")->GetAsArray();
436     uint32_t segcount = segments->GetSize();
437     for (size_t j = 0; j < segcount; j++) {
438       Segment segment;
439       StructuredData::Dictionary *seg =
440           segments->GetItemAtIndex(j)->GetAsDictionary();
441       segment.name =
442           ConstString(seg->GetValueForKey("name")->GetAsString()->GetValue());
443       segment.vmaddr =
444           seg->GetValueForKey("vmaddr")->GetAsInteger()->GetValue();
445       segment.vmsize =
446           seg->GetValueForKey("vmsize")->GetAsInteger()->GetValue();
447       segment.fileoff =
448           seg->GetValueForKey("fileoff")->GetAsInteger()->GetValue();
449       segment.filesize =
450           seg->GetValueForKey("filesize")->GetAsInteger()->GetValue();
451       segment.maxprot =
452           seg->GetValueForKey("maxprot")->GetAsInteger()->GetValue();
453 
454       // Fields that aren't used by DynamicLoaderDarwin so debugserver doesn't
455       // currently send them in the reply.
456 
457       if (seg->HasKey("initprot"))
458         segment.initprot =
459             seg->GetValueForKey("initprot")->GetAsInteger()->GetValue();
460       else
461         segment.initprot = 0;
462 
463       if (seg->HasKey("flags"))
464         segment.flags =
465             seg->GetValueForKey("flags")->GetAsInteger()->GetValue();
466       else
467         segment.flags = 0;
468 
469       if (seg->HasKey("nsects"))
470         segment.nsects =
471             seg->GetValueForKey("nsects")->GetAsInteger()->GetValue();
472       else
473         segment.nsects = 0;
474 
475       image_infos[i].segments.push_back(segment);
476     }
477 
478     image_infos[i].uuid.SetFromStringRef(
479         image->GetValueForKey("uuid")->GetAsString()->GetValue());
480 
481     // All sections listed in the dyld image info structure will all either be
482     // fixed up already, or they will all be off by a single slide amount that
483     // is determined by finding the first segment that is at file offset zero
484     // which also has bytes (a file size that is greater than zero) in the
485     // object file.
486 
487     // Determine the slide amount (if any)
488     const size_t num_sections = image_infos[i].segments.size();
489     for (size_t k = 0; k < num_sections; ++k) {
490       // Iterate through the object file sections to find the first section
491       // that starts of file offset zero and that has bytes in the file...
492       if ((image_infos[i].segments[k].fileoff == 0 &&
493            image_infos[i].segments[k].filesize > 0) ||
494           (image_infos[i].segments[k].name == ConstString("__TEXT"))) {
495         image_infos[i].slide =
496             image_infos[i].address - image_infos[i].segments[k].vmaddr;
497         // We have found the slide amount, so we can exit this for loop.
498         break;
499       }
500     }
501   }
502 
503   return true;
504 }
505 
506 void DynamicLoaderDarwin::UpdateSpecialBinariesFromNewImageInfos(
507     ImageInfo::collection &image_infos) {
508   uint32_t exe_idx = UINT32_MAX;
509   uint32_t dyld_idx = UINT32_MAX;
510   Target &target = m_process->GetTarget();
511   Log *log(lldb_private::GetLogIfAnyCategoriesSet(LIBLLDB_LOG_DYNAMIC_LOADER));
512   ConstString g_dyld_sim_filename("dyld_sim");
513 
514   ArchSpec target_arch = target.GetArchitecture();
515   const size_t image_infos_size = image_infos.size();
516   for (size_t i = 0; i < image_infos_size; i++) {
517     if (image_infos[i].header.filetype == llvm::MachO::MH_DYLINKER) {
518       // In a "simulator" process (an x86 process that is
519       // ios/tvos/watchos/bridgeos) we will have two dyld modules --
520       // a "dyld" that we want to keep track of, and a "dyld_sim" which
521       // we don't need to keep track of here. If the target is an x86
522       // system and the OS of the dyld binary is ios/tvos/watchos/bridgeos,
523       // then we are looking at dyld_sym.
524 
525       // debugserver has only recently (late 2016) started sending up the os
526       // type for each binary it sees -- so if we don't have an os type, use a
527       // filename check as our next best guess.
528       if (image_infos[i].os_type == llvm::Triple::OSType::UnknownOS) {
529         if (image_infos[i].file_spec.GetFilename() != g_dyld_sim_filename) {
530           dyld_idx = i;
531         }
532       } else if (target_arch.GetTriple().getArch() == llvm::Triple::x86 ||
533                  target_arch.GetTriple().getArch() == llvm::Triple::x86_64) {
534         if (image_infos[i].os_type != llvm::Triple::OSType::IOS &&
535             image_infos[i].os_type != llvm::Triple::TvOS &&
536             image_infos[i].os_type != llvm::Triple::WatchOS) {
537             // NEED_BRIDGEOS_TRIPLE image_infos[i].os_type != llvm::Triple::BridgeOS) {
538           dyld_idx = i;
539         }
540       }
541       else {
542         // catch-all for any other environment -- trust that dyld is actually
543         // dyld
544         dyld_idx = i;
545       }
546     } else if (image_infos[i].header.filetype == llvm::MachO::MH_EXECUTE) {
547       exe_idx = i;
548     }
549   }
550 
551   if (exe_idx != UINT32_MAX) {
552     const bool can_create = true;
553     ModuleSP exe_module_sp(
554         FindTargetModuleForImageInfo(image_infos[exe_idx], can_create, NULL));
555     if (exe_module_sp) {
556       if (log)
557         log->Printf("Found executable module: %s",
558                     exe_module_sp->GetFileSpec().GetPath().c_str());
559       target.GetImages().AppendIfNeeded(exe_module_sp);
560       UpdateImageLoadAddress(exe_module_sp.get(), image_infos[exe_idx]);
561       if (exe_module_sp.get() != target.GetExecutableModulePointer()) {
562         target.SetExecutableModule(exe_module_sp, eLoadDependentsNo);
563       }
564     }
565   }
566 
567   if (dyld_idx != UINT32_MAX) {
568     const bool can_create = true;
569     ModuleSP dyld_sp =
570         FindTargetModuleForImageInfo(image_infos[dyld_idx], can_create, NULL);
571     if (dyld_sp.get()) {
572       if (log)
573         log->Printf("Found dyld module: %s",
574                     dyld_sp->GetFileSpec().GetPath().c_str());
575       target.GetImages().AppendIfNeeded(dyld_sp);
576       UpdateImageLoadAddress(dyld_sp.get(), image_infos[dyld_idx]);
577       SetDYLDModule(dyld_sp);
578     }
579   }
580 }
581 
582 void DynamicLoaderDarwin::UpdateDYLDImageInfoFromNewImageInfo(
583     ImageInfo &image_info) {
584   if (image_info.header.filetype == llvm::MachO::MH_DYLINKER) {
585     const bool can_create = true;
586     ModuleSP dyld_sp =
587         FindTargetModuleForImageInfo(image_info, can_create, NULL);
588     if (dyld_sp.get()) {
589       Target &target = m_process->GetTarget();
590       target.GetImages().AppendIfNeeded(dyld_sp);
591       UpdateImageLoadAddress(dyld_sp.get(), image_info);
592       SetDYLDModule(dyld_sp);
593     }
594   }
595 }
596 
// Remember DYLD_MODULE_SP as the dyld module. Only a weak reference is
// stored (m_dyld_module_wp), so this does not keep the module alive.
void DynamicLoaderDarwin::SetDYLDModule(lldb::ModuleSP &dyld_module_sp) {
  m_dyld_module_wp = dyld_module_sp;
}
600 
601 ModuleSP DynamicLoaderDarwin::GetDYLDModule() {
602   ModuleSP dyld_sp(m_dyld_module_wp.lock());
603   return dyld_sp;
604 }
605 
606 bool DynamicLoaderDarwin::AddModulesUsingImageInfos(
607     ImageInfo::collection &image_infos) {
608   std::lock_guard<std::recursive_mutex> guard(m_mutex);
609   // Now add these images to the main list.
610   ModuleList loaded_module_list;
611   Log *log(lldb_private::GetLogIfAnyCategoriesSet(LIBLLDB_LOG_DYNAMIC_LOADER));
612   Target &target = m_process->GetTarget();
613   ModuleList &target_images = target.GetImages();
614 
615   for (uint32_t idx = 0; idx < image_infos.size(); ++idx) {
616     if (log) {
617       log->Printf("Adding new image at address=0x%16.16" PRIx64 ".",
618                   image_infos[idx].address);
619       image_infos[idx].PutToLog(log);
620     }
621 
622     m_dyld_image_infos.push_back(image_infos[idx]);
623 
624     ModuleSP image_module_sp(
625         FindTargetModuleForImageInfo(image_infos[idx], true, NULL));
626 
627     if (image_module_sp) {
628       ObjectFile *objfile = image_module_sp->GetObjectFile();
629       if (objfile) {
630         SectionList *sections = objfile->GetSectionList();
631         if (sections) {
632           ConstString commpage_dbstr("__commpage");
633           Section *commpage_section =
634               sections->FindSectionByName(commpage_dbstr).get();
635           if (commpage_section) {
636             ModuleSpec module_spec(objfile->GetFileSpec(),
637                                    image_infos[idx].GetArchitecture());
638             module_spec.GetObjectName() = commpage_dbstr;
639             ModuleSP commpage_image_module_sp(
640                 target_images.FindFirstModule(module_spec));
641             if (!commpage_image_module_sp) {
642               module_spec.SetObjectOffset(objfile->GetFileOffset() +
643                                           commpage_section->GetFileOffset());
644               module_spec.SetObjectSize(objfile->GetByteSize());
645               commpage_image_module_sp = target.GetSharedModule(module_spec);
646               if (!commpage_image_module_sp ||
647                   commpage_image_module_sp->GetObjectFile() == NULL) {
648                 commpage_image_module_sp = m_process->ReadModuleFromMemory(
649                     image_infos[idx].file_spec, image_infos[idx].address);
650                 // Always load a memory image right away in the target in case
651                 // we end up trying to read the symbol table from memory... The
652                 // __LINKEDIT will need to be mapped so we can figure out where
653                 // the symbol table bits are...
654                 bool changed = false;
655                 UpdateImageLoadAddress(commpage_image_module_sp.get(),
656                                        image_infos[idx]);
657                 target.GetImages().Append(commpage_image_module_sp);
658                 if (changed) {
659                   image_infos[idx].load_stop_id = m_process->GetStopID();
660                   loaded_module_list.AppendIfNeeded(commpage_image_module_sp);
661                 }
662               }
663             }
664           }
665         }
666       }
667 
668       // UpdateImageLoadAddress will return true if any segments change load
669       // address. We need to check this so we don't mention that all loaded
670       // shared libraries are newly loaded each time we hit out dyld breakpoint
671       // since dyld will list all shared libraries each time.
672       if (UpdateImageLoadAddress(image_module_sp.get(), image_infos[idx])) {
673         target_images.AppendIfNeeded(image_module_sp);
674         loaded_module_list.AppendIfNeeded(image_module_sp);
675       }
676     }
677   }
678 
679   if (loaded_module_list.GetSize() > 0) {
680     if (log)
681       loaded_module_list.LogUUIDAndPaths(log,
682                                          "DynamicLoaderDarwin::ModulesDidLoad");
683     m_process->GetTarget().ModulesDidLoad(loaded_module_list);
684   }
685   return true;
686 }
687 
688 //----------------------------------------------------------------------
689 // On Mac OS X libobjc (the Objective-C runtime) has several critical dispatch
690 // functions written in hand-written assembly, and also have hand-written
691 // unwind information in the eh_frame section.  Normally we prefer analyzing
692 // the assembly instructions of a currently executing frame to unwind from that
693 // frame -- but on hand-written functions this profiling can fail.  We should
694 // use the eh_frame instructions for these functions all the time.
695 //
696 // As an aside, it would be better if the eh_frame entries had a flag (or were
697 // extensible so they could have an Apple-specific flag) which indicates that
698 // the instructions are asynchronous -- accurate at every instruction, instead
699 // of our normal default assumption that they are not.
700 //----------------------------------------------------------------------
701 
702 bool DynamicLoaderDarwin::AlwaysRelyOnEHUnwindInfo(SymbolContext &sym_ctx) {
703   ModuleSP module_sp;
704   if (sym_ctx.symbol) {
705     module_sp = sym_ctx.symbol->GetAddressRef().GetModule();
706   }
707   if (module_sp.get() == NULL && sym_ctx.function) {
708     module_sp =
709         sym_ctx.function->GetAddressRange().GetBaseAddress().GetModule();
710   }
711   if (module_sp.get() == NULL)
712     return false;
713 
714   ObjCLanguageRuntime *objc_runtime = m_process->GetObjCLanguageRuntime();
715   if (objc_runtime != NULL && objc_runtime->IsModuleObjCLibrary(module_sp)) {
716     return true;
717   }
718 
719   return false;
720 }
721 
722 //----------------------------------------------------------------------
723 // Dump a Segment to the file handle provided.
724 //----------------------------------------------------------------------
725 void DynamicLoaderDarwin::Segment::PutToLog(Log *log,
726                                             lldb::addr_t slide) const {
727   if (log) {
728     if (slide == 0)
729       log->Printf("\t\t%16s [0x%16.16" PRIx64 " - 0x%16.16" PRIx64 ")",
730                   name.AsCString(""), vmaddr + slide, vmaddr + slide + vmsize);
731     else
732       log->Printf("\t\t%16s [0x%16.16" PRIx64 " - 0x%16.16" PRIx64
733                   ") slide = 0x%" PRIx64,
734                   name.AsCString(""), vmaddr + slide, vmaddr + slide + vmsize,
735                   slide);
736   }
737 }
738 
739 const DynamicLoaderDarwin::Segment *
740 DynamicLoaderDarwin::ImageInfo::FindSegment(const ConstString &name) const {
741   const size_t num_segments = segments.size();
742   for (size_t i = 0; i < num_segments; ++i) {
743     if (segments[i].name == name)
744       return &segments[i];
745   }
746   return NULL;
747 }
748 
749 //----------------------------------------------------------------------
750 // Dump an image info structure to the file handle provided.
751 //----------------------------------------------------------------------
752 void DynamicLoaderDarwin::ImageInfo::PutToLog(Log *log) const {
753   if (!log)
754     return;
755   if (address == LLDB_INVALID_ADDRESS) {
756     LLDB_LOG(log, "modtime={0:x+8} uuid={1} path='{2}' (UNLOADED)", mod_date,
757              uuid.GetAsString(), file_spec.GetPath());
758   } else {
759     LLDB_LOG(log, "address={0:x+16} modtime={1:x+8} uuid={2} path='{3}'",
760              address, mod_date, uuid.GetAsString(), file_spec.GetPath());
761     for (uint32_t i = 0; i < segments.size(); ++i)
762       segments[i].PutToLog(log, slide);
763   }
764 }
765 
//----------------------------------------------------------------------
// Re-initialize this loader for "process": call Clear(true), store "process"
// as the process this loader works on, and ask that process's target to clear
// all of its loaded sections.
//----------------------------------------------------------------------
void DynamicLoaderDarwin::PrivateInitialize(Process *process) {
  // Debug-only trace: DEBUG_PRINTF expands to nothing unless
  // ENABLE_DEBUG_PRINTF is defined.  Note that it reads m_process before the
  // assignment below, so it reports the state of the process stored so far,
  // not necessarily that of the "process" argument.
  DEBUG_PRINTF("DynamicLoaderDarwin::%s() process state = %s\n", __FUNCTION__,
               StateAsCString(m_process->GetState()));
  // NOTE(review): Clear() is defined outside this chunk; it presumably drops
  // the loader's cached state, and it runs while m_process still holds the
  // previous value -- keep this ordering unless Clear() is confirmed not to
  // depend on it.
  Clear(true);
  m_process = process;
  m_process->GetTarget().ClearAllLoadedSections();
}
773 
774 //----------------------------------------------------------------------
775 // Member function that gets called when the process state changes.
776 //----------------------------------------------------------------------
777 void DynamicLoaderDarwin::PrivateProcessStateChanged(Process *process,
778                                                      StateType state) {
779   DEBUG_PRINTF("DynamicLoaderDarwin::%s(%s)\n", __FUNCTION__,
780                StateAsCString(state));
781   switch (state) {
782   case eStateConnected:
783   case eStateAttaching:
784   case eStateLaunching:
785   case eStateInvalid:
786   case eStateUnloaded:
787   case eStateExited:
788   case eStateDetached:
789     Clear(false);
790     break;
791 
792   case eStateStopped:
793     // Keep trying find dyld and set our notification breakpoint each time we
794     // stop until we succeed
795     if (!DidSetNotificationBreakpoint() && m_process->IsAlive()) {
796       if (NeedToDoInitialImageFetch())
797         DoInitialImageFetch();
798 
799       SetNotificationBreakpoint();
800     }
801     break;
802 
803   case eStateRunning:
804   case eStateStepping:
805   case eStateCrashed:
806   case eStateSuspended:
807     break;
808   }
809 }
810 
811 ThreadPlanSP
812 DynamicLoaderDarwin::GetStepThroughTrampolinePlan(Thread &thread,
813                                                   bool stop_others) {
814   ThreadPlanSP thread_plan_sp;
815   StackFrame *current_frame = thread.GetStackFrameAtIndex(0).get();
816   const SymbolContext &current_context =
817       current_frame->GetSymbolContext(eSymbolContextSymbol);
818   Symbol *current_symbol = current_context.symbol;
819   Log *log(lldb_private::GetLogIfAllCategoriesSet(LIBLLDB_LOG_STEP));
820   TargetSP target_sp(thread.CalculateTarget());
821 
822   if (current_symbol != NULL) {
823     std::vector<Address> addresses;
824 
825     if (current_symbol->IsTrampoline()) {
826       const ConstString &trampoline_name = current_symbol->GetMangled().GetName(
827           current_symbol->GetLanguage(), Mangled::ePreferMangled);
828 
829       if (trampoline_name) {
830         const ModuleList &images = target_sp->GetImages();
831 
832         SymbolContextList code_symbols;
833         images.FindSymbolsWithNameAndType(trampoline_name, eSymbolTypeCode,
834                                           code_symbols);
835         size_t num_code_symbols = code_symbols.GetSize();
836 
837         if (num_code_symbols > 0) {
838           for (uint32_t i = 0; i < num_code_symbols; i++) {
839             SymbolContext context;
840             AddressRange addr_range;
841             if (code_symbols.GetContextAtIndex(i, context)) {
842               context.GetAddressRange(eSymbolContextEverything, 0, false,
843                                       addr_range);
844               addresses.push_back(addr_range.GetBaseAddress());
845               if (log) {
846                 addr_t load_addr =
847                     addr_range.GetBaseAddress().GetLoadAddress(target_sp.get());
848 
849                 log->Printf("Found a trampoline target symbol at 0x%" PRIx64
850                             ".",
851                             load_addr);
852               }
853             }
854           }
855         }
856 
857         SymbolContextList reexported_symbols;
858         images.FindSymbolsWithNameAndType(
859             trampoline_name, eSymbolTypeReExported, reexported_symbols);
860         size_t num_reexported_symbols = reexported_symbols.GetSize();
861         if (num_reexported_symbols > 0) {
862           for (uint32_t i = 0; i < num_reexported_symbols; i++) {
863             SymbolContext context;
864             if (reexported_symbols.GetContextAtIndex(i, context)) {
865               if (context.symbol) {
866                 Symbol *actual_symbol =
867                     context.symbol->ResolveReExportedSymbol(*target_sp.get());
868                 if (actual_symbol) {
869                   const Address actual_symbol_addr =
870                       actual_symbol->GetAddress();
871                   if (actual_symbol_addr.IsValid()) {
872                     addresses.push_back(actual_symbol_addr);
873                     if (log) {
874                       lldb::addr_t load_addr =
875                           actual_symbol_addr.GetLoadAddress(target_sp.get());
876                       log->Printf(
877                           "Found a re-exported symbol: %s at 0x%" PRIx64 ".",
878                           actual_symbol->GetName().GetCString(), load_addr);
879                     }
880                   }
881                 }
882               }
883             }
884           }
885         }
886 
887         SymbolContextList indirect_symbols;
888         images.FindSymbolsWithNameAndType(trampoline_name, eSymbolTypeResolver,
889                                           indirect_symbols);
890         size_t num_indirect_symbols = indirect_symbols.GetSize();
891         if (num_indirect_symbols > 0) {
892           for (uint32_t i = 0; i < num_indirect_symbols; i++) {
893             SymbolContext context;
894             AddressRange addr_range;
895             if (indirect_symbols.GetContextAtIndex(i, context)) {
896               context.GetAddressRange(eSymbolContextEverything, 0, false,
897                                       addr_range);
898               addresses.push_back(addr_range.GetBaseAddress());
899               if (log) {
900                 addr_t load_addr =
901                     addr_range.GetBaseAddress().GetLoadAddress(target_sp.get());
902 
903                 log->Printf("Found an indirect target symbol at 0x%" PRIx64 ".",
904                             load_addr);
905               }
906             }
907           }
908         }
909       }
910     } else if (current_symbol->GetType() == eSymbolTypeReExported) {
911       // I am not sure we could ever end up stopped AT a re-exported symbol.
912       // But just in case:
913 
914       const Symbol *actual_symbol =
915           current_symbol->ResolveReExportedSymbol(*(target_sp.get()));
916       if (actual_symbol) {
917         Address target_addr(actual_symbol->GetAddress());
918         if (target_addr.IsValid()) {
919           if (log)
920             log->Printf(
921                 "Found a re-exported symbol: %s pointing to: %s at 0x%" PRIx64
922                 ".",
923                 current_symbol->GetName().GetCString(),
924                 actual_symbol->GetName().GetCString(),
925                 target_addr.GetLoadAddress(target_sp.get()));
926           addresses.push_back(target_addr.GetLoadAddress(target_sp.get()));
927         }
928       }
929     }
930 
931     if (addresses.size() > 0) {
932       // First check whether any of the addresses point to Indirect symbols,
933       // and if they do, resolve them:
934       std::vector<lldb::addr_t> load_addrs;
935       for (Address address : addresses) {
936         Symbol *symbol = address.CalculateSymbolContextSymbol();
937         if (symbol && symbol->IsIndirect()) {
938           Status error;
939           Address symbol_address = symbol->GetAddress();
940           addr_t resolved_addr = thread.GetProcess()->ResolveIndirectFunction(
941               &symbol_address, error);
942           if (error.Success()) {
943             load_addrs.push_back(resolved_addr);
944             if (log)
945               log->Printf("ResolveIndirectFunction found resolved target for "
946                           "%s at 0x%" PRIx64 ".",
947                           symbol->GetName().GetCString(), resolved_addr);
948           }
949         } else {
950           load_addrs.push_back(address.GetLoadAddress(target_sp.get()));
951         }
952       }
953       thread_plan_sp.reset(
954           new ThreadPlanRunToAddress(thread, load_addrs, stop_others));
955     }
956   } else {
957     if (log)
958       log->Printf("Could not find symbol for step through.");
959   }
960 
961   return thread_plan_sp;
962 }
963 
964 size_t DynamicLoaderDarwin::FindEquivalentSymbols(
965     lldb_private::Symbol *original_symbol, lldb_private::ModuleList &images,
966     lldb_private::SymbolContextList &equivalent_symbols) {
967   const ConstString &trampoline_name = original_symbol->GetMangled().GetName(
968       original_symbol->GetLanguage(), Mangled::ePreferMangled);
969   if (!trampoline_name)
970     return 0;
971 
972   size_t initial_size = equivalent_symbols.GetSize();
973 
974   static const char *resolver_name_regex = "(_gc|_non_gc|\\$[A-Za-z0-9\\$]+)$";
975   std::string equivalent_regex_buf("^");
976   equivalent_regex_buf.append(trampoline_name.GetCString());
977   equivalent_regex_buf.append(resolver_name_regex);
978 
979   RegularExpression equivalent_name_regex(equivalent_regex_buf);
980   const bool append = true;
981   images.FindSymbolsMatchingRegExAndType(equivalent_name_regex, eSymbolTypeCode,
982                                          equivalent_symbols, append);
983 
984   return equivalent_symbols.GetSize() - initial_size;
985 }
986 
987 lldb::ModuleSP DynamicLoaderDarwin::GetPThreadLibraryModule() {
988   ModuleSP module_sp = m_libpthread_module_wp.lock();
989   if (!module_sp) {
990     SymbolContextList sc_list;
991     ModuleSpec module_spec;
992     module_spec.GetFileSpec().GetFilename().SetCString(
993         "libsystem_pthread.dylib");
994     ModuleList module_list;
995     if (m_process->GetTarget().GetImages().FindModules(module_spec,
996                                                        module_list)) {
997       if (module_list.GetSize() == 1) {
998         module_sp = module_list.GetModuleAtIndex(0);
999         if (module_sp)
1000           m_libpthread_module_wp = module_sp;
1001       }
1002     }
1003   }
1004   return module_sp;
1005 }
1006 
1007 Address DynamicLoaderDarwin::GetPthreadSetSpecificAddress() {
1008   if (!m_pthread_getspecific_addr.IsValid()) {
1009     ModuleSP module_sp = GetPThreadLibraryModule();
1010     if (module_sp) {
1011       lldb_private::SymbolContextList sc_list;
1012       module_sp->FindSymbolsWithNameAndType(ConstString("pthread_getspecific"),
1013                                             eSymbolTypeCode, sc_list);
1014       SymbolContext sc;
1015       if (sc_list.GetContextAtIndex(0, sc)) {
1016         if (sc.symbol)
1017           m_pthread_getspecific_addr = sc.symbol->GetAddress();
1018       }
1019     }
1020   }
1021   return m_pthread_getspecific_addr;
1022 }
1023 
1024 lldb::addr_t
1025 DynamicLoaderDarwin::GetThreadLocalData(const lldb::ModuleSP module_sp,
1026                                         const lldb::ThreadSP thread_sp,
1027                                         lldb::addr_t tls_file_addr) {
1028   if (!thread_sp || !module_sp)
1029     return LLDB_INVALID_ADDRESS;
1030 
1031   std::lock_guard<std::recursive_mutex> guard(m_mutex);
1032 
1033   const uint32_t addr_size = m_process->GetAddressByteSize();
1034   uint8_t buf[sizeof(lldb::addr_t) * 3];
1035 
1036   lldb_private::Address tls_addr;
1037   if (module_sp->ResolveFileAddress(tls_file_addr, tls_addr)) {
1038     Status error;
1039     const size_t tsl_data_size = addr_size * 3;
1040     Target &target = m_process->GetTarget();
1041     if (target.ReadMemory(tls_addr, false, buf, tsl_data_size, error) ==
1042         tsl_data_size) {
1043       const ByteOrder byte_order = m_process->GetByteOrder();
1044       DataExtractor data(buf, sizeof(buf), byte_order, addr_size);
1045       lldb::offset_t offset = addr_size; // Skip the first pointer
1046       const lldb::addr_t pthread_key = data.GetAddress(&offset);
1047       const lldb::addr_t tls_offset = data.GetAddress(&offset);
1048       if (pthread_key != 0) {
1049         // First check to see if we have already figured out the location of
1050         // TLS data for the pthread_key on a specific thread yet. If we have we
1051         // can re-use it since its location will not change unless the process
1052         // execs.
1053         const tid_t tid = thread_sp->GetID();
1054         auto tid_pos = m_tid_to_tls_map.find(tid);
1055         if (tid_pos != m_tid_to_tls_map.end()) {
1056           auto tls_pos = tid_pos->second.find(pthread_key);
1057           if (tls_pos != tid_pos->second.end()) {
1058             return tls_pos->second + tls_offset;
1059           }
1060         }
1061         StackFrameSP frame_sp = thread_sp->GetStackFrameAtIndex(0);
1062         if (frame_sp) {
1063           ClangASTContext *clang_ast_context =
1064               target.GetScratchClangASTContext();
1065 
1066           if (!clang_ast_context)
1067             return LLDB_INVALID_ADDRESS;
1068 
1069           CompilerType clang_void_ptr_type =
1070               clang_ast_context->GetBasicType(eBasicTypeVoid).GetPointerType();
1071           Address pthread_getspecific_addr = GetPthreadSetSpecificAddress();
1072           if (pthread_getspecific_addr.IsValid()) {
1073             EvaluateExpressionOptions options;
1074 
1075             lldb::ThreadPlanSP thread_plan_sp(new ThreadPlanCallFunction(
1076                 *thread_sp, pthread_getspecific_addr, clang_void_ptr_type,
1077                 llvm::ArrayRef<lldb::addr_t>(pthread_key), options));
1078 
1079             DiagnosticManager execution_errors;
1080             ExecutionContext exe_ctx(thread_sp);
1081             lldb::ExpressionResults results = m_process->RunThreadPlan(
1082                 exe_ctx, thread_plan_sp, options, execution_errors);
1083 
1084             if (results == lldb::eExpressionCompleted) {
1085               lldb::ValueObjectSP result_valobj_sp =
1086                   thread_plan_sp->GetReturnValueObject();
1087               if (result_valobj_sp) {
1088                 const lldb::addr_t pthread_key_data =
1089                     result_valobj_sp->GetValueAsUnsigned(0);
1090                 if (pthread_key_data) {
1091                   m_tid_to_tls_map[tid].insert(
1092                       std::make_pair(pthread_key, pthread_key_data));
1093                   return pthread_key_data + tls_offset;
1094                 }
1095               }
1096             }
1097           }
1098         }
1099       }
1100     }
1101   }
1102   return LLDB_INVALID_ADDRESS;
1103 }
1104 
1105 bool DynamicLoaderDarwin::UseDYLDSPI(Process *process) {
1106   Log *log(lldb_private::GetLogIfAnyCategoriesSet(LIBLLDB_LOG_DYNAMIC_LOADER));
1107   bool use_new_spi_interface = false;
1108 
1109   llvm::VersionTuple version = process->GetHostOSVersion();
1110   if (!version.empty()) {
1111     const llvm::Triple::OSType os_type =
1112         process->GetTarget().GetArchitecture().GetTriple().getOS();
1113 
1114     // macOS 10.12 and newer
1115     if (os_type == llvm::Triple::MacOSX &&
1116         version >= llvm::VersionTuple(10, 12))
1117       use_new_spi_interface = true;
1118 
1119     // iOS 10 and newer
1120     if (os_type == llvm::Triple::IOS && version >= llvm::VersionTuple(10))
1121       use_new_spi_interface = true;
1122 
1123     // tvOS 10 and newer
1124     if (os_type == llvm::Triple::TvOS && version >= llvm::VersionTuple(10))
1125       use_new_spi_interface = true;
1126 
1127     // watchOS 3 and newer
1128     if (os_type == llvm::Triple::WatchOS && version >= llvm::VersionTuple(3))
1129       use_new_spi_interface = true;
1130 
1131     // NEED_BRIDGEOS_TRIPLE // Any BridgeOS
1132     // NEED_BRIDGEOS_TRIPLE if (os_type == llvm::Triple::BridgeOS)
1133     // NEED_BRIDGEOS_TRIPLE   use_new_spi_interface = true;
1134   }
1135 
1136   if (log) {
1137     if (use_new_spi_interface)
1138       log->Printf(
1139           "DynamicLoaderDarwin::UseDYLDSPI: Use new DynamicLoader plugin");
1140     else
1141       log->Printf(
1142           "DynamicLoaderDarwin::UseDYLDSPI: Use old DynamicLoader plugin");
1143   }
1144   return use_new_spi_interface;
1145 }
1146